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D D DUO Tera un 
D E] SLIPD] D D D 0 0 
D D D D 
BSDI O00 
D D 2.0(199D[] Net/2 N 
I000000000 
4.4BSD-Lite(1994) 
00000 Neva D 
01-1 0000 TCP/IPD 0000 BSD[] D 
4. 4BSD-Litel] ODO! Net/3 
U. C. Berkeley 0 0000 TCP/IP 
U u u U u u 
[] [] SunOS 4.x V 
A(SVRA)[] AIX 3.2 TCP/IP 
U U U 
1-1 0 10 O 1982[] [| 4.1cBSDO O U 
1983 4.2BSD 
4.1cBSD BSD TCP/IP Bolt Beranek and 
Newman(BBN)[] Rob Gurwitz[] Jack Haverty [Salus 1994] 18000 
4.2BSD[] [| BBN]] TCP/IP] O O | 0 
Ballistics[] Mike Muuss[] PDP-11 TCP/IP 0 
i L 0 O [Karels and 
McKusick 1986] 4.2BSD[] 4.3BSD [Jacobson 1990d][] 0 [| I 
4.3BSD Tahoe[] 4.3BSD Reno[] [| 
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XTI[] TLI 
Net/3( BSD ) 
TCP/IP Unix TLI 
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1 /* 

2 * Send a UDP datagram to the daytime server on some other host, 
3 * read the reply, and print the time and date on the server. 

4 */ 


5 #include <sys/types.h> 
6 #include <sys/socket.h> 
7 #include <netinet/in.h> 
8 #include <arpa/inet.h> 
9 #include <stdio.h> 
10 #include <stdlib.h> 
11 #include <string.h> 
12 #define BUFFSIZE 150 /* arbitrary size */ 
13 int 
14 main() 
15 ( 
16 struct sockaddr_in serv; 
17 char buff [BUFFSIZE]; 
18 int sockfd, n; 
19 if ((sockfd = socket (PF INET, SOCK_DGRAM, 0)) < 0) 
20 err_sys("socket error"); 
21 bzero((char *) &serv, sizeof(serv)); 
22 serv.sin_family = AF_INET; 
23 serv.sin addr.s addr = inet_addr("140.252.1.32"); 
24 serv.sin_port = htons(13); 
25 if (sendto(sockfd, buff, BUFFSIZE, 0, 
26 (struct sockaddr *) &serv, sizeof(serv)) != BUFFSIZE) 
27 err_sys("sendto error"); 
28 if ((n = recvfrom(sockfd, buff, BUFFSIZE, 0, 
29 (struct sockaddr *) NULL, (int *) NULL)) < 2) 
30 err_sys("recvfrom error"); 
31 buff[n - 2] = 0; /* null terminate */ 
32 printf("%s\n", buff); 
33 exit (0); 
34 ) 
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SVR4 socket open 
/dev/udp sockmod sendto 
putmsg recvfrom getmsg SVR 4 
API 
Net/1 send[] sendto 
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socket 
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v-node Unix 
socket Internet 
socket 
a.out 
( 0) ( 1) 2) 1-5 
Net/3 oL 1 
socket 3 
socket 
p_fd filedesc 































































































































































































Chi a*pUbecom i 9 





























































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































fd ofileflags ( ) 
fd ofiles 8 bit 
close-on-exec mapped-from-device 
0 
Unix 
proc{} ` Char[] 
[0]: 0 
filedesc() [1]: 0 
p_fd [2]: 0 
[3]: 0 
fd ofileflags 
fd ofiles 
*fileOTl 
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soo_select | fo_select 
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inp laddr inp. laddr so pcb 
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inp socket inp. socket 
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node — 
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fileops 
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socket DTYPE SOCKET file 
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file file file socket 
socket inpcb 
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. mbufj (m ext.ext buf) (m ext.ext size) 
2048 m datallm ext.ext buf ( 
) m data | m ext | ext free 
Net/3 
° m next[] mbu ( ) mbuf 1-8 
. m_nextpkt ( ) mbuf| 
mbu mbuf| mbuf 
mbu | mbu m nextpkt m 
mbu m nextpkt 
2-2 1-8 
UDP ( 14 mbu 
IP ) TCP 1460 TCP 
mbuf| IP[] TCP 
(m data) 
Net/3 M EXT mbu 
m ext mbuf pkthdr 
UDP mbu MT DATA TCP 
mbu MT HEADER UDP[] TCP 
mbuf 
mbuf[] m flags M PKTHDR 
mbu (Net/3 mbu 2-1) 
Net/1 mbu [Leffler et al. 1989[] p.290] Net/2 
m flags m act m nextpkt 
mbu 
mbu UDP[] TCP UDP M PREPEND 
([] 23-15 23.1)[] TCP MGETHDR([] 26-25) 
22 [III 
mbu C mbu mbuf| 
2-3 
Oo U Oo U 
sys/mbuf.h mbuf[] 00 mbut DO D 
kern/uipc mbuf.c mbuf]] H 
023 0000000 
2.2.1 HH 






































































































































28 


TCP/IP 2 




























































































China-pub.com 











0 H 


0000 


o d 


mba 0000 ( 2-9) 


024 00000000 











































































































































































































































































































































































































































































































































































































222 
mbstat 2-5 
mbstat[] ] [] [] 
m clfree DO 
m clusters U DDD DDD D 
m_drain U D D D D dan] D D D DD 0 0 0 0 
m_drops OOOO (0 010 0 00 0 
m mbufs U D D (0 D 10 000 mburi) 
m_mtypes[256] [] U mbuff [1 E] 00 MT xxx[] O 
m spare D D DD (00) 
m wait OOOO (100100 
02-5 000 mbstat JO OO mbuf]] O 
netstat -m 2-6 
clusters (34[] m clfree (32) —— (DU m clusters(34) 
mbuf (99x 128 ) (34x 2048 
) 1024 mbu (99x 128 ) (2x 2048 
(80 ) 100 





































































































netstat -m output mbstat member 


99 mbufs in use: 
1 mbufs allocated to data 
43 mbufs allocated to packet headers 


17 mbufs allocated to protocol control blocks 
20 mbufs allocated to socket names and addresses 


18 mbufs allocated to socket ee 
2/34 mapped pages in use 
80 Kbytes allocated to network (208. in use) 
0 requests for memory denied 
0 requests for memory delayed 
0 calls to protocol drain routines 
































3 
o 
u 
A 
° 
+ 

NA 





0 2-6 mbuf[] DO O 


m_mtypes [MT DATA) 
m_mtypes (MT, HEADER) 
m mtypes[MT PCB] 

m mtypes[MT SONAME] 
m mtypes [MT SOOPTS] 
(see text) 

(see text) 

m drops 

m wait 

m drain 





Net/3 




















































































































































































































( netstat 
























































































































































































































































































































































/dev/mem 














































































































































































































China-pubıcoN 29 



























































































































































































































































































































































































































































































































































2.3 mbuff ID 
mbu 2-7 MCLBYTES 
/usr/include/machine/param.h mbuf.h 
MCLBYTES 2048 DO mbu) 0000000 
MHLEN 100 U D D 0 D D mg 00000 
MINCLSIZE 208 00000000000 
MLEN 108 U D D meuf] D 0 B D UD 
MSIZE 128 O O mbuf] 0 O 
0 2-7 mbuf.h [| [| mbuf[] O 


2.4 mbuf[] [| 

















2-8 mbuf 

































































FE mbuf.h 
60 /* header at beginning of each mbuf: */ 


61 struct m hdr ( 


62 struct mbuf *mh next; /* next buffer in chain */ 

63 struct mbuf *mh nextpkt; /* next chain in queue/record */ 
64 int mh len; /* amount of data in this mbuf */ 
65 caddr t mh data; /* pointer to data */ 

66 short mh type; /* type of data (Figure 2.10) */ 
67 short mh flags; /* flags (Figure 2.9) */ 

68 ); 


69 /* record/packet header in first mbuf of chain; valid if M PKTHDR set */ 
70 struct pkthdr ( 


71 int len; /* total packet length */ 
72 struct ifnet *rcvif; /* receive interface */ 
73 Y; 


74 /* description of external storage mapped into mbuf, valid if M EXT set */ 
75 struct m ext { 


76 caddr t ext buf; /* start of buffer */ 

77 void (*ext free) (); /* free routine if not the usual */ 
78 u int ext size; /* size of buffer, for ext free */ 
79 1; 

80 struct mbuf ( 

81 struct m hdr m hdr; 

82 union ( 

83 struct ( 

84 struct pkthdr MH pkthdr; /* M PKTHDR set */ 

85 union { 

86 struct m ext MH ext; /* M EXT set */ 

87 char MH databuf [MHLEN] ;. 

88 ) MH dat; 

89 ) MH; 

90 char M databuf [MLEN] ; /* IM PKTHDR, !M EXT */ 

91 ) M dat; 

92 Y; 


O 2-8 mof [] [J 












































30 TCP/IP 2 China+pub.Com 
— — 0 ill 



























































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































93 #define m next m hdr.mh next 
94 #define m len m hdr.mh len 
95 #define m data m hdr.mh data 
96 #define m type m hdr.mh type 
97 #define m flags m hdr.mh flags 
98 #define m nextpkt m hdr.mh nextpkt 
99 #define m act m nextpkt 
100 #define m pkthdr M dat.MH.MH, pkthdr 
101 #define m ext M dat.MH.MH dat.MH ext 
102 #define m pktdat M dat.MH.MH dat.MH databuf 
103 #define m dat M, dat.M databuf 
M ——————————————————— MULT 
02-8 (0) 
mbuf m hdr 
M PKTHDR|| M EXT 
93-103 11[] #define mbuf 
Net/3 
mbuf m next[] mbuf 
mbuf| m nextpkt[| mbu mbu 
1-8 mbu m len m pkthdr.len 
mbu m len 
2-9 m flags 
m flags [] U 
M BCAST O000000007/00 
M EOR U D D 0 
M_EXT 0 mubf[] ID (OO00 ) 
M MCAST O000000007/00 
M PKTHDR U U DU D U D (000000 meuf 
M COPYFLAGS M PKTHDR/M EOR/M BCAST/M MCAST 
[] 2-9 m flags |] 
M_EXT|| M_PKTHDR|| M EOR mbuf 
Internet ( TCP) TCP 
OSI[] XNS 
mubf| M_BCAST|| M_MCAST 
( 1-3) 
M_COPYFLAGS mbuf 
2-10 MT_xxx m_type mbu 
mbuf mbu 
1-6 mbuf| 
sendto m_type MT_SONAME 









































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































2-10 mbuf Net/3 (MT HTABLE) 
TCP/IP MT_OOBDATA OSI[] XNS 
TCP (out-of-band) ( [] 29.7 ) | 
mbuf| 
Mbuf m type O O Net/3 TCP/IP[] O [] O Hat 
MT CONTROL . 0200000090 M MBUF 
MT DATA . BUB M MBUF 
MT FREE 000000 M_FREE 
MT_FTABLE ° But M FTABLE 
MT HEADER . n, UO m M MBUF 
MT HTABLE IMPO DO M HTABLE 
MT IFADDR Hogg M_IFADDR 
MT_OOBDATA HO (0000 M_MBUF 
MT_PCB DB M PCB 
MT RIGHTS uut M MBUF 
MT RTABLE Ooo M_RTABLE 
MT_SONAME . 000 M MBUF 
MT SOOPTS . Hood M_SOOPTS 
MT_SOCKET Hood M_SOCKET 
02-10 DO mtyee D D 
M xxx) mbuf] 
60[] [] M xxx | malloc MALLOC | 
2-6 netstat —m[] mbu MT xxx 
vmstat -M M xxx 
mbu (128 ) mbu — 
108 Net/3 mbu TCP ( 24 
) mbuf MT_PCB 4. 4BSD | 108 
140 
2-10 MT PCB mbuf| 2-6 
Unix mbu mbuf| 
Internet 
2.5 000 mbuff ood 
mbuf( mbuf mbuf ) 
M 
" 2 < 
C L ) 
( ) 
























































































































































































































































































































































3 ar China-pubıcom 
—— — EE 


2.5.1 m get 


































































































































































































2-11 mbu m get MGET 




















uipc_mbuf.c 
134 struct mbuf * 
135 m_get (nowait, type) 
















































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































136 int nowait, type; 
137 I 
138 struct mbuf *m; 
139 MGET (m, nowait, type); 
140 return (m); 
141 } š 
uipc_mbuf.c 
0 2-11 mge 0000000 mbuf 
Net/3 ANSIC ANSIC 
Net/3 ANSIC <sys/mbuf.h> 
struct mbuf *m_get (int, int); 
nowait M WAIT[| M DONTWAIT 
mbuf sendto ([] 1-6) 
M WAIT 
mbu ([] 1-10) M DONTWAIT 
mbuf 
2.5.2 MGET 
2-12 MGET MGET sendto ([] 1-6) 
mbu 
MGET (m, M WAIT, MT SONAME); 
if (m == NULL) 
return (ENOBUFS); 
154 #define MGET(m, how, type) { \ mbuf.h 
155 MALLOC((m), struct mbuf +, MSIZE, mbtypes[type], (how)); \ 
156 if (m) ( Ó 
157 (m)-»m type = (type); \ 
158 MBUFLOCK (mbstat.m mtypes[type]-*;) V 
159 (m)-»m next = (struct mbuf *)NULL; \ 
160 (m)-»m nextpkt = (struct mbuf *)NULL; \ 
161 (m)-»m data = (m)-»m dat; \ 
162 (m)-»m flags = 0; \ 
163 ) else \ 
164 (m) = m retry((how), (type)); \ 








China pubscom EN 33 



































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































M WAIT 2-13 mbu 
154-157 MGET MALLOC 
mbtypes[] mbuf[] MT xxx M xxx[] ([] 2-10) m type 
158 mbu I(mbstat) MBUFLOCK 
(U 1-13) mbstat.m_ 
mtypes [type] ++ mbu 
C ++ (1) (2) 1] (3) 
770 0) MGET 10 2 
78) MGET mbufl 
(77) 1(78) MGET 3 
(78) 79 78 
159-160 mbu m next[| m_nextpkt 
mbu 
161-162 108 mbu 0 
163-164 m retry([] 2-13) M WAIT 
M DONTWAIT 
2.5.8 m retry 
2-13 m retry 
uipc mbuf.c 


92 struct mbuf * 
93 m retry(i, t) 

































































































































































































































































































































































































































































































































































































































































































































































94 int i, tt 
95 I 
96 Struct mbuf *m; 
97 m reclaim(); 
98 #define m retry(i, t) (struct mbuf *)0 
99 MGET(m, i, t); 
100 #undef m retry 
101 return (m); 
102 } e 
uipc_mbuf.c 
02-13 m retry U U 
92-97 m_retry m_reclaim 7.4 
" drain” m reclaim 10-32 
IP[] drain IP IP TCP[] drain 
UDP drain 
98-102 m_reclaim 
MGET mbuf| MGET([] 2-12) m retry 
MGET m 
m retry MGET m retry 








































































































































































































China-pubecom 





3 4 TCP/IP 



























































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































2 
MGET 
2.5.4 mbufl] 
spl 2-12 MBUFLOCK 
MALLOC splimp splx 
MFR mbu 
mbu MCLALLOC|| MCLFREE splimp splx 
MGET 
m get spl 
2.6 m devget[] m_pullup|]| |] 
IP[] ICMP[] IGMP[] UDP[] TCP m_pullup 
( ) mbuf 
mbuf m_pullup 
m_devget mtod|| dtom 

































































Net/3[] mbu 














2.6.1 m devget[] 

















































































































































































































































































































































































































































































































m devget mbuf 
( ) 4 
mbuf 2-14 
mbuf () mbuf () 
m_next NULL 
m_nextpkt NULL 
m_len 52 
m_data 
m_type MT_DATA 
m_flags M_PKTHDR M_PKTHDR 
m pkthdr.len 52 m pkthdr.len 85 


m pkthdr.rcvif ptr 


2000 
(O IPD O 




















oOo 
SE 






m pkthdr.rcvif |ptr 














gef D DD ss 85< 000 <100 


O 2-14 mdevget 000000000 mbuf 


Chi a-bubıcoM 


mbuf {} 
m_len 


m_pkthdr.len 


m pkthdr.rcvif 

















101<0 0 0 0 207 


O 2-15 m_devget 
































































































































































































































































































































































































































































































































































































































































































































































































































































































































1) I 2-14 mbuf| 0-84 
52 
20 IP 32 
TCP ( 20 TCP 
12 TCP ) TCP 
m devget mbuf IP 
m len 28[] 20 IP 
8 UDP 0 UDP 
m_devget mbuf 16 
14 
14 
mbuf 
icmp reflect 
tcp respond mbuf 
mbuf 
84 
16 
16 
14 mbuf 
IP 
2) 85-100 
mbu 16 


























































































































35 






































20 mbufl 











000000 mbuf 























DIDO 


0000 30 mbuf 


mbuf {} 


m_nextpkt 









MT. DATA 

M PKTHDR|M EXT 
m pkthdr.len 1500 

ptr 

NULL 


m ext.ext size 












208x [1 000 < 2048 
20480 0 O 








O 2-16 m devget 000040 mbuf 


T 


36 





CP/IP 





























China-pub.tom 







































































































































































85 





























3) 




























































































101-207 




































































mbuf) 


















































































































































mbuf 






















































































devget 






























































208 



































































































































1500 




































































































































































mbu 

















EXT 






















































































2.6.2 mtod| 














dtom | 














mtod 



































dtom 





mbuf.h 
























































mbu 

















#define 
#define 


mtod(“ 




















mbu 


mtod(m,t) 
dtom (x) 


((t) ( 
( (struct mbuf *) ((i 


(m)->m data)) 














nt) (x) & ^(MSIZE-1))) 



































”) 























mbu 




















































































































struct mbuf *m; 
struct ip *ip; 


ip 
ip->ip_v 


mtod (m, 


struct ip 
IPVERSION; 





mbu 








(m_data) 

















SI 





































































































ip 




































































C ( 
























































mbu 



































mbuf] ( 














2-14 








2-15) 





AN 


2-16) 



































dtom (“ 











mbuf” ) 








































































































































































































buf 


























































































































ip 











mbu 


















































struct mbuf *m; 
struct ip *ip; 


m = dtom(ip); 








mbuf 




























































































MSIZE(128) 


















































mbuf] 























MSIZE 


















































dtom 





























mbu 















































dtom 








































































































































































































mbuf 


























dtom 
































































































































m_pullup 





2.6.3 m pullup 








m pullup 





































































































(IP[] ICMP[] I 














GMP 








UDP 












































mbuf 


























(m_len) 






































( IP 





























20 











UDP 























20) 





























m_pullup 


































































































































































































37 





































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































20 mbufl 
m_pullup mbuf| N mbuf N 
100 (MHLEN) N 
mbuf mtod[] dtom 
IP 
if (m->m len < sizeof (struct ip) ££ 
(m = m_pullup(m, sizeof(struct ip))) == 0) { 
ipstat.ips_toosmall++; 
goto next; 
å = mtod(m, struct ip +); 
mbu 200 IP JU m pullup m pullup 
(1) mbuf| MGET (2) mbuf 
( N| 20) 
m pullup IP| 1 IP 
mbuf 20 
m_pullup ( C && mbu 
) 2-14-[] 2-16 
mbuf| IP| 100 
60 IP 40 TCP ( — — ICMP[] IGMP 
UDP—— 40 ) mbuf| ( 
) mbuf| 
(m len ) m pullup mbuf| 
MPFail m pullup 
1 Net/3 2700 IP MPFail 9 
ipstat.ips_toosmall 9 (ICMP[] IGMP[] UDP 
TCP[] ) m_pullup 0 m_pullup 
IP 
2.6.4 m_pullup|] IP 
m_pullup IPL] TCP IP 296 
IP IP mbuf| 
2-16 mbuf[] 296 2- 
17 
IP IP IP 
( IP 
10 ) TP 
2-17 IP 
( ) mbuf 
m_data dtom mbuf IP 











































































































































































































38 





































































































































































































































































































































































































































































































































































































































































































China-pub.com 


























































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































TCP/IP 2 
2-17 
mbuf () 
m next NULL 
m nextpkt NULL 
m len 296 
m data 
m type MT DATA 
m flags M PKTHDR|M EXT 
m pkthdr.len 296 
m pkthdr.rcvif ptr 
m ext.ext buf 
m ext.ext free|NULL 
m ext.ext size|2048 
. HUU TI: ers IU DD 
0000 El] 0000 
IP hdr 
2760 0000 
20480 0 0 
02-17 00000 290 PO O 
IP 
m pullup 20 IP mbu 
if (m->m_flags & M_EXT) { 
if ((m = m_pullup(m, sizeof(struct ip))) == 0) I 
ipstat.ips_toosmall++; 
goto next; 
} 
ip = mtod(m, struct ip *); 
} 
2-18 m_pullup mbuf m_pullup 
mubf 40 mbuf 40 | 
20 IP ( ICMP[] IGMP 
UDP[] TCP) 40([] 7-17 max protohdr) 
20 IP 20 TCP ( 
OSI ) 
2-18 IP mbuf IP 
dtom mbuf] 























































































































































































m_pkthdr.len 296 


m_pkthdr.rcvif |pir 
IPO O 


00000200 U 





















































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































20480 000 
02-18 DO mpatie JO 000 2960 PI O 
265 TCP m_pullup 
TCP m_pullup m_pullup 
mbu TCP 
1 19 TCP ( 512 
) ( 90% 10 ) 
TCP[] IP 2-14 ( 
mbu ) 2-16 ( ) TCP 
TCP IP IP 
TCP IP IP 
mbu (U 2-17) 
27.9 TCP[] mbu TCP 
mbu m pullup 
IP mbu ([] 2-18) dtom 
IP| 27.9 
tcp reass 














































































































40 






































China-bubscom 

































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































TCP/IP| 20 U 
2.6.6 m pullup |] | 
uut | m pullupl 
e U D D D 0 D U D D D U D U IP U 0 D D U D U D mb IE | L u 
000000 uu (IP[] ICMP[] IGMP[] UDP[] TCP)[] [| O m_pulluel ll Ú 
OOOO00Om euiiug[ IO 0 U D IP D D U 0 D D U m eurrupl UU 0 l] 
0 OM 1 
«GO O O IPU ID [| IP DOODODODO m_pullupl| U U lll 
000000 U U D U U D D meul lup D D D 0 UD D 0 D 0 OD 208000 
e00 TCPO LPU D 0 0 U TC PD D D 0 U U 0000000000 
m pullup [O U O O IPO TCP[] ID LH LU Ú 
2.7 mbuf 0 000090 
U U U mbuf[f] D H D 0 H B] 0000219000 l 2200 D] EL 00000 2-190 [| 
U U #define 
U U mbuff DUU L l U U U U 0 U L LU U U U U U U U LU L 
[] mbuf[] [] | up Net] Hii U i Hi UU B B. U D] D] D] U LUJ U U LU U U U L 
0000000000 
U p 0 
MCLGET DU D DDD (0 D 000 D WOM D D mbat 0 D D DD (mdata0 000000 
DU DDD DDD DDD 0 DD D 0 D D mbuf OM ExTU O 
void MCLGET (struct mbuf * m, int nowait) ; 
MFREE O000=000m9f00»%J0000G00MmMEx0D0O00000000000000 
O0000000000000000000 00 2.90 DD 10 DD œD DD (U m 
-»m next[][][] (] 0 D D 0000 a0 
void MFREE (struct mbuf *m, struct mbuf *n); 
MGETHDR U D D D mbu DD 0 D DD 0 D D D D D D 0 D D DD verd 2-120 00000 
000 x exrgpRD D H D D D 0 Gata D D D 0 D D D 0 D 10000000 
void MGETHDR (struct mbuf * m, int nowait, int type); 
MH_ALIGN U D D D D D D D D D D mbuff] m data] O00 mbuf 0 D D D 0 D 0 D DDD len 
O000000000000000000000000 
void MH ALIGN (struct mbuf zm, int len); 
M PREPEND 0 m0 D D mbt] D D 0 D 0 D 0 ent] D 0 D 0 D U D meuf] 0 D D DD 0 D Um sata) 
[] len] 000000 Gi ren D fen] D D D D D 0 D D D 0 D D D D D D D D D mbufl 
(Om next[] D D D 0 D ml] D D D mbufl] D D D D 0 m D D D Depu D D D D D 0 0 D 
U D rent] D 0 D D D D D D 0 mbufl] D D (CI D Ü J O Mmari D D D D mb O00 
DU D D D 0 mu D D D D D 0 D D D D D D D DUDU D mu D D  mbuff] 
void M_PREPEND (struct mbuf *m, int len, int nowait); 
dtom DU D D D 0 mbu D D D D D D D D D D 0 D D D D D D 0 D mbut 0 D 0 D 0 D 
struct mbuf *dtom(void *x); 
mtod DU mD D D mburi D D D D D D D 0 D D D rype] O 
type mtod(struct mbuf nt, type); 














02-19 9000000000 mbuti 


Chi à*büf Co 020 mo 00000 41 











U DU 0 HU 


m_adj U "D D D mbpu£[] D D ent) D D D 0 DD D eeQ DD D D D 0 D D 0 D DDD U 
mbuf[] D D D zen] D D D 0 D D D D D D mb O00 ee D D D D D U 


void m_adj(struct mbuf *m, int len); 

















m_cat 007000 mbu 0 0 0 D D mD D D mutQ 0 0 0 D D 0 D D D 0 POOO (0 10 
U JD 000000 
void m_cat (struct mbuf *m, struct mbuf *n); 
m_copy Om copyrn D 0 D D D 0 0 DU D 0 4000000 M_DONTWAIT 
struct mbuf * m_copy (struct mbuf *m, int offset, int len); 
m_copydata U "D D D mbufl] D O00 en) 0 0 0 0 D cg 0 D D D DU mbuli D D 0 0 D DU 


offset] 0 D D D D 


void m copydata(struct mbuf *m, int offset, int len, caddr_t cp); 


m_copyback Dol D D 0 D DU len 000000000 mbufl] 00000 mbut) 0 E D 
offset] D D D D D D D mbut 0 0 D 0 0 0 mbufl] UU 


void m_copyback (struct mbuf *m, int offset, int len, caddr_t cp); 


m_copym 000000 mb D D 0 D mO D D mu D D D D offset] D D 12000000 
OO mbufl] DD 0 00 D 0000000000 eni DB M corraLtL] god 
mbuf] 00 offse 0 D D 0 D D 0 D D 0 D UD 2970000000000000 














Ooo 


struct mbuf *m_copym(struct mbuf *m, int offset, int len, int nowait) ; 


m_devget 0000000000 mbfG D D D D 0 D D 0 D D D D D D D D D D D D D D le 
revif] 00000 leuD (pD D D D D cop] D D D D (02007100000 mb O 
OO cop) D 0 0 DDD D DDD peopvD D D D 0 D D D D 0 0 0 eff 00 0 0 U 
2600000000 


struct mbuf *m_devget (char *buf, int len, int off, struct ifnet *ifp, 











void (*copy) (const void *, void +, u int)); 





m_free [] {FREED OOOO 


struct mbuf *m_free(struct mbuf *m); 











m freem OO m7 D D 000000 mbuf 
void m_freem(struct mbuf * m); 
m_get met] 000000002-020000000 
struct mbuf *m get (int nowait, int type); 
m getclr 000000 meri 0000 meu D D 1080000000 


struct mbuf *m_getclr (int nowait, int type); 





m_gethdr [] MGETHDR[I OOOO 
struct mbuf *m_gethdr (int nowait, int type); 


U 0 D D 0 D D D mbu D D D D D 0 D len D 0 D D D 0 D 0 D 0 0 D 0 0 D U 
O mbu) D D D D 0 D 0 D 0 mod D D 0 D 0 D 0 0 D D 0 DD ent) O00 
U DD 2.60 000 0000 

struct mbuf m pullup(struct mbuf nf, int len); 


02-20 0000000000 mbull] O 


000000 0 nowaitf] M wArT[] M_DONTWAIT[] O [| type] [| 2-100 [ O O MT xxx[] 
U U U U 





m_pullup 
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2 
M PREPEND 1-7 1-8 IP[] UDP 
mbu ( 1-8 
2-2) mbu 
M copydata caddr t š Y 
«sys/types.h» char * 
mmap 4.4BSD[] SVR4 
caddr_t 
2.8 Net/3[] I 000000 
Net/3 Net/3 
( <sys/queue.h>) 
1) mbu m next mbu 
2) mbuf mbu mbuf| m nextpkt 
2-21 
sockbuf{} mbuf() mbuf() . 
= NULL 
NULL 
mbuf{} mbuf () mbuf {} 
m_next NULL 
m_nextpkt m_nextpkt m_nextpkt |NULL 
02-21 000000 mbuf[] D D D 
mbuf mbu 
UDP 
TCP ( mbuf 
mbuf) 
mbuf mbuf 
m_next mbu mbuf| 
m nextpkt 
3) mbu 
2-22 ([] 3-13) 2-2 
2-21 
4) 


















































Chinaspubscom T 43 




























































m next 
m nextpkt 


0222 100000000090 
2-23 IP (U 10[] ) (U 220 ) 














































































































































































































TCP ( 27.90 > 


































































































mbuf —— 












































































































































































































































































































































next previous 


























next[] previous 


































































































































































































































































































































































































































































































insque[] remque([] 10-20) 


2.9 m copy] JU D] D U 

























































































































































































































































































































































































































































































































































































mbu 
10[] mbu 1024 mbuf| 100 8 
108 60 10[] mbufi 
1024 mbuf 
(2048 + 128)[] 2176 1280 10 (10x 128) 
mbu TCP m_copy 














































































































































































































































































































44 
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TCP/IP 2 
write 4096 TCP 
4096 2048 
TCP mbuf] 
2-24 tcp output socket! sockbuf 
mbu so snd.sb mb 
socket () mbuft} 
NULL 
Imnextpke Je 
m len 2048 
|n type |MT DATA 
M PKTHDR |M EXT 
m_pkthdr.len 2048 
fm_pkthar. reviF NULL 
[m ext -ext_free | NULL 
m ext.ext size|2048 
20480 00 
20480 D000 
0 2-24 0 0 20480) 00070000 0000 
( ) TCP (MSS)[] 1460|] tcp. output 
1460 IP[] TCP mbuf 
(16 ) mbu IP mbuf 
2-25 
1.9 UDP UDP[] mbu mbu 
IP UDP mbuf TCP 
TCP 
tcp output m_copy 1460 
m_copy mbuf([] 2-25 ) 
( ) mbu 
1460 588 mbuf 1514 
IP TCP 
2-25 mbuf| 
mbu m_copy mbu mbuf| 
mbuf mbuf 





























China=pupecom 255 45 




























































































































































































m pkthdr.len 
























































2048 
socket () mbuf() 

m next NULL 
m nextpkt NULL 

so snd.sb mb m len 2048 
m data 
m type MT DATA 
m flags M PKTHDR |M EXT 


m_pkthdr.len 12048 

m pkthdr.rcvif|NULL 
TCP[] DO Ú m ext.ext buf 

m ext.ext free|NULL 

m ext.ext size|2048 









































20480 0 0 
20480 D000 
mbuf () mbuf () 
> m next NULL 
m nextpkt NULL 
m len m len 1460 
m data 
MT HEADER m type MT DATA 
M. PKTHDR m flags M PKTHDR|M EXT 
m pkthdr.len 1514 m pkthdr.len 2048 


















































































































































































































































































































































































































































[00000 Im pkthår.revif | NULL m pkthdr.rcvif NULL 
TCPO OO ER mme m ext.ext buf 
00000 Te ot Free NULL 

U U m ext.ext size| 2048 
02-25 TCPO O O0 0 0 0 DD 0 00 000 0-0 0 
mbuf mbuf[] —— 
mbuf 1 
1 0 
( 2.4) 
2-25 mbuf 
m_freem mbu 


















































































































































































































































46 oao 0 China-pub.tom 
AA tgeg 










































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































mbu 1 1 
TCP 
socket () mbuf {} mbuf {} 
m_next m_next NULL 
m_nextpkt NULL m_nextpkt NULL 
so_snd.sb_mb m_len 2048 m_len 2048 
m_data m_data 
m_type MT_DATA m_type MT_DATA 
m_flags M-EKTHDR l m_flags e RER | 
m pkthdr.len 2048 m pkthdr.len 2048 
m pkthdr.rcvif|NULL m pkthdr.rcvif|NULL 
m ext.ext buf m ext.ext buf 
m ext.ext free|NULL m ext.ext free|NULL 
m ext.ext size|2048 m ext.ext size|2048 
2048[] OM 2048[] OM 
146000000 
20800000 
5889 0000 
mbuf {} mbuf() | mbuf {} 
m next m next NULL 
m_nextpkt NULL m_nextpkt NULL m_nextpkt NULL 
m_len 54 m_len 588 m_len 872 
m data m data 
MT HEADER |m type MT DATA m type MT DATA 
M PKTHDR m flags M EXT m flags M EXT 
m pkthdr.len 1514 
m pkthd cvif 
m ext.ext buf m ext.ext buf 
m ext.ext free|NULL m ext.ext free|NULL 
m ext.ext size|2048 m ext.ext size|2048 
02-26 DUU 14600 0 TCPO O 00 mbuf] 
588 tcp output 
1460 IP ( 26 tcp output 
) 2048 
mbu TCP mbuf) 



















































































































































































































































































tcp output 1460 mbu 











































































































20 mbufl 
































47 



























































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































m_copy 1460 (1460 
2-26 mbu ( mbu 
IP TCP ) 
1460 588 872 
mbuf 1460 m_copy 1460 
2-26 mbuf 
m_copy mbuf 
mbu sosend 
m copy 
210 0000 
mbuf] | 
Van Jacobson [Partridge 1993] Internet 
mbuf [Jacobson 1993] 
mbu 
mbuf| 
mbu VAX-11/780[] 4 
mbu mbu [Hutchinson and Peterson 1991] mbu 
2.11 00 
mbuf 
mbuf| 
M PKTHDR|| M EXT 4 mbu 
e mbu 0-108 
. mbu 0-100 
N L ) 
° ( ) 
mbuf] mbu 2-19 2-20 
mbuf] 
m devget 



































































































































































































































48 
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TCP/IP 2[] | 
U m_pullupl | | U O mbuf 

mbuf ( OO) m_copy TCP 

U U OU OU U U | U U 
0 U 0 U 

U U 
2.1 2-9 M COPYFLAGS M_EXT 
2.2 2.6 m_pullup | 
(IOB) 
2.3 O U dr om 2.6 0 —— 0 
| O mbuf[] E] E] E] I] L] 
2.4 mbuf 0 20 0 ( [] 1024[] 2048) | LU L] 
Net/3 U ( B) 

2.5 [] 2-50 o m drops[] m wait O O mbufi 









































































































































































































































































































































































































































































































































































































































































































































ipsu tt 


O30 U D U 
















































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































o DB 
Net/3 i 
(U U ) 
Net/3 
. ut 
(best-effort) 
Net/3 
1) AMD 7990 LANCE 
2) [] [] IP(SLIP) U uuu U uuu 
3) l U U U U 00000 
3.2 [JD D D] 
| U EL U C 
C 8 3-1 
[] [] [] [] 
sys/socket.h 000000 
net/if.h 000000 
net/if dl.h 0000000 
kern/init_main.c 0200000090 
net/if.c 000000 
net/if loop.c 00000000 
net/if_sl.c SEP 000090 
hp300/dev/if le.c LANCE Hj H B B B B 0 ü 





























031 0000000 





3.2.1 [ u 




















3-2 





































































































50 


TCP/IP| 














2| 











China-pub.com 








































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































pdevinit struct pdevinit[] DU DD SLP 0 0 D 0 D 000 0 D 0 U 
ifnet struct ifnet * ifnet] 0000000 
ifnet addrs struct ifaddr **| JO00O00000000000 
if_indexlim int O [] ifnet_addrs] [I 0 
if_index int OO0OO0000000 
ifqmaxlen int 0000000000 
hz int paga d0000 (0/0) 
132 DDD DB D IJ D D: D Ú 
3.2.2 SNMP| 
Ne/3 I 0000000000000000000000000 Hd U U u 
000000000000 (SNMP MIB-ID[ OOO TCP/IP[] 00000000 
[| U RFC 1213 [McCloghrie and Rose 1991][] SNMP MIB-II O 03-30 DD 10 
SNMP[] 0 U 
System 000000 
Interfaces 000000 
Address Translation O000000000000G0000) 
IP IPD D D Ú 
ICMP ICMPO 0 ] Ü 
TCP TCP) OOO 
UDP UDPO DUDU 
EGP EGPO O O D 
Transmission 000000 
SNMP SNMPI OOO 
O 3-3 MIB-II[] O SNMP[] 
Net/3[] 0 SNMP ||] D Net/3[] SNMP{] D O l U T OM 
UUOUSNMPJ D 000 2201| LU LU U U U D U U U U U 0 U 
Net/30 7 000 MIB-11[] UU [| SNMP uti Lu uL Lu LLL 
MIB-II[] D (1) OM 
(2) 000 (3) 0 
L LU U U U U 
ISODE O [| Net/3 SNMP[] [] [] ISODE|] [| O B| 
U 34] 000 SNMP] O 00000000 U U DD 47000 SNMP[] 
LU U U 
SNMP[ D Net/3Q O o D 
ifNumber if index + 1 if_indexJ TOOO0O00G000000000000 
U 00 D 10000000000 ifNumber 
034 000000000005 MPE 









































3.3 ifnet|] |] 




















































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































ifnet 
ifnet ifnet 
3-5 
3-5 3 ifaddr 
Internet[] OSI 
Internet ifaddr() 
OSI ([] 3-5 ) = 
ifnet ([] 3-5 03-5 DDimet [0 000 
) ifar D D 0 0 D 
Net/3 
Internet 
Net/2 
IP 
ifnet 
. 
. 
. 
. 
. 
3-6 ifnet 
ifh 
80 struct ifnet { 
81 struct ifnet *if_next; /* all struct ifnets are chained */ 
82 struct ifaddr *if_addrlist; /* linked list of addresses per if */ 
83 char *if_name; /* name, e.g. ‘le’ or ‘lo’ */ 
84 short if_unit; /* sub-unit for lower level driver */ 
85 u_short if_index; /* numeric abbreviation for this if */ 
86 short if_flags; /* Figure 3.7 */ 
87 short if_timer; /* time ‘til if watchdog called */ 
88 int if_pcount; /* number of promiscuous listeners */ 
89 caddr_t if bpf; /* packet filter structure */ ifh 
If. 
0 3-6 ifnet [] L] D] 1] HI] D] L] 
80-82 if next ifnet if attach 
if addrlist ifaddr (U 3-16) 
ifaddr 
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83-86 if name[] 00000 if unit) D D 0 
SLIP 0 0 if name 0 OD" si" 
[] if unit [| if unit[] 0 [] O 1[] if index 
sysctl|] ( 19.14] 5[] O 0 
| | | | SLIP 0 
IP[] E] H EL E] E]. H] if index 00000060 
if flags | 
70 “ |” 4.4 SIOCGIFFLAGS 
SIOCSIFFLAGS 
if_flags 0000 [] [] 
IFF BROADCAST . 000000 
IFF_MULTICAST . 000000 
IFF POINTOPOINT . DU DD DDD DD 
IFF_LOOPBACK DOOOOODOO 
IFF_OACTIVE . 000000 
IFF_RUNNING . 0000000000 
IFF_SIMPLEX . 000000000000 090 
IFF_LINKO 000 0000000000 
IFF LINKI 000 OOO000000 
IFF LINK2 000 NDODODOODDND 
IFF_ALLMULTI 000000000090 
IFF_DEBUG DOOOOOOO 
IFF_NOARP 0000000000 ARPD O 
IFF_NOTRAILERS DOOOOODOO 
IFF_PROMISC O000000000 
IFF UP OOO000 
[ 3-7 if flags |] 
IFF BROADCAST[] IFF POINTOPOINT 
IFF CANTCHANGE[] " "OO U 
“ P ” L 
(IFF. LINKx)| O | 
| 3-29 SLIP 
2. 
87 if_timer if_watchdog 
u! u u 
3. BSD 
88-89 if pcount[| if bpf BSD (BPF) BPF 
Hu U 
BPF[] [| BPF 31100 
ifnet UDO DO DD 3-8 HOUddUO 
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ifh 
90 struct if_data { 
91 /* generic interface information */ 
92 u_char ifi_type; /* Figure 3.9 */ 
93 u_char ifi, addrlen; /* media address length */ 
94 u char ifi hdrlen; /* media header length */ 
95 u long ifi mtu; /* maximum transmission unit */ 
96 u long ifi_metric; /* routing metric (external only) */ 
97 u long ifi, baudrate; /* linespeed */ 
138 #define if mtu if data.ifi mtu 
139 #define if, type if data.ifi type 


140 #define if addrlen if data.ifi addrlen 
141 #define if hdrlen if data.ifi hdrlen 
142 #define if metric if data.ifi, metric 


143 #define if baudrate if data.ifi baudrate fh 
m———————————————————————— — if. 


0 3-8 ifmet JI00000 





























































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































Net/3 138[] -143 #define ifnet 
4. 
90-92 if_type 3-9 net/if_types.h 
if_type 
if_type U U 
IFT OTHER OOo 
IFT_ETHER 000 
IFT_ISO88023 IEEE 802.30 9 O (CSMA/CD) 
IFT_ISO88025 IEEE 802.59 00 
IFT FDDI O0O0000000 
IFT LOOP D 0 0 0 
IFT SLIP 000 IP 
134 if 000000 
93-94 if addrlen if hdrlen 
6 14 (O 4-8) 
95 if_mtu 
1500 
96-97 if_metric 0 if_baudrate 
SLIP 
3-10 ifnet 
5. 
98-111 












































































































































































































































































































































if collisions[]l[] if noproto 
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IP OSI ) IP SLIP 









































































































































































































































if noprotol]l 











ifh 


98 /* volatile statistics */ 


99 u long ifi ipackets; /* #packets received on interface */ 
100 u_long ifi_ierrors; /* #input errors on interface */ 

101 u_long ifi_opackets; /* #packets sent on interface */ 

102 u long ifi, oerrors; /* #output errors on interface */ 

103 u long ifi collisions; /* #collisions on csma interfaces */ 
104 u long ifi ibytes; /* #bytes received */ 

105 u long ifi obytes; /* #bytes sent */ 

106 u long ifi, imcasts; /* #packets received via multicast */ 
107 u long ifi omcasts; /* #packets sent via multicast */ 

108 u long ifi iqdrops; /* #packets dropped on input, for this 
109 interface */ 
110 u long ifi noproto; /* #packets destined for unsupported 
111 protocol */ 

112 struct timeval ifi lastchange; /* last updated */ 
113 ) if data; 





144 #define if ipackets if data.ifi ipackets 

145 #define if ierrors if data.ifi ierrors 

146 #define if opackets if data.ifi opackets 

147 #define if oerrors if data.ifi oerrors 

148 #define if, collisions if data.ifi collisions 
149 #define if ibytes if data.ifi ibytes 

150 #define if obytes if data.ifi obytes 

151 #define if imcasts if data.ifi imcasts 

152 #define if omcasts if data.ifi omcasts 

153 #define if iqdrops if data.ifi igdrops 

154 #define if noproto if_data.ifi_noproto 

155 #define if lastchange if data.ifi lastchange 





ifh 


03-10 OO ifmet DUDUD 

















































































































































































































































































































































































































































































































Net/1 ifnet 
SNMP MIB-II 
if_iqdrops SLIP IF_DROP SLIP 
if snd.ifq drops (U 3-13)[] 1 SNMP 
ifq_drops BSD ISODE SNMP if_iqdrops 
if_snd.ifq_drops 























6. 
112-113 if_lastchange 






























































































































































Net/3 144 155 #define ifnet 

























































































































































































ifnet 3-11 
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ifh 
114 /* procedure handles */ 
115 int (*if_init) /* init routine */ 
116 (int); 
117 int (*if_output) /* output routine (enqueue) */ 
118 (struct ifnet *, struct mbuf *, struct sockaddr *, 
119 struct rtentry *); : 
120 int (*if start) /* initiate output routine */ 
121 (struct ifnet *); 
122 int (*if done) /* output complete routine */ 
123 (struct ifnet *); /* (XXX not used; fake prototype) */ 
124 int (fif ioctl) /* ioctl routine */ 
125 (struct ifnet *, int, caddr t); 
126 int (*if reset) 
127 (int); /* new autoconfig will permit removal */ 
128 int (*if watchdog) /* timer routine */ 
129 (int); A 
ifh 
03-11 OU ifnet [] [I D [I D€ 
7. 
114-129 ifnet 7 
3-12 
Net/3 /* XXX * 
if done 
Net/3 
0 E 0 E 
if init 00000 
if output O0O00000000000 
if start OOO0000 
if done OOO00000 dn» 
if ioctl U D vorn D D 0 
if reset D D DOD 
if watchdog 000000 
g 3-12 00 ifnet [] D LH Ll Ú 
4 SLIP ifnet 
ifp ifnet 
(*ifp->if start) (ifp) 
if start 
ifnet 3-13 
130-137 if snd ifnet 
ifq head ( )] ifq tail 
if len ifq maxlen 
50( ifqmaxlen 
IFQ MAXLEN ) mbuf ifq drops 
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TCP/IP 2H I 
Uli L 3-14| L LU | | 
- ifh 
130 struct ifqueue ( 
131 struct mbuf *ifg head; 
132 Struct mbuf *ifq tail; 
133 int ifq len; /* current length of queue */ 
134 int ifg maxlen; /* maximum length of queue */ 
135 int ifq drops; /* packets dropped because of full queue */ 
136 ) if snd; /* output queue */ q 
137 3; š 
if.h 
03-13 0 O ifnet [] D] LH] Ú Ú 
0 E 0 E 
IF_QFULL fa D ü 
int IF QFULL(struct ifqueue *ifq); 
IF DROP IF DROP) D D #000 ifa drops] 10 D DDD 0 D D D D 0 000 D DOD 0 0 
void IF DROP (struct ifqueue *ifq); 
IF_ENQUEUE D D D mp D D f0 000000000 mbufl] O00 m_nextext0 0000 
void IF_ENQUEUE (struct ifqueue *ifq, struct mbuf *m); 
IF_PREPEND D D D mI] DD 00000 
void IF_PREPEND (struct ifqueue *ifq, struct mbuf *m); 
IF_DEQUEUE ¿00000000000 »000000000000000»-=000 
void IF_DEQUEUE (struct ifqueue *ifq, struct mbuf *m); 
if qflush O000740000000000000000000 
void if gflush(struct ifqueueifd); 
[] 3-14 fiqueue [] [] 
50 O O net/if.h Ol | if qflush[)[] net/if.c 
i 0 | | 
s = splimp(); 


if (IF QFULL(inq)) { 


IF DROP(inq); 


m freem(m); 





/* queue is full, drop new packet */ 























































































































































































































































































































































































































) eise 

IF ENQUEUE (ing, m); /* there is room, add to end of queue */ 
splx(s); 

E uut 0 E IF DROP[] ifq drops[l 19 0 0 

TCP (U) UDP)[] Í 
splimp[| splx u 
splx m freem[] O [] mbuf [| splimp 
m_freem [| splx m_freem (2.5) 



























































































































































Chinaspubecow 57 
















































































































































































































































































































































































































































































































































































































































































































































































































































































































3.4 ifaddr[] [| 
ifaddr 3-15 
ifaddr 
ifaddr 
TCP/IP Net/3 
TCP/IP 
ifh 
217 struct ifaddr { 
218 struct ifaddr *ifa next; /* next address for interface */ 
219 struct ifnet tifa ifp; /* back-pointer to interface */ 
220 struct sockaddr *ifa addr; /* address of interface */ 
221 struct sockaddr “ifa dstaddr; /* other end of p-to-p link */ 
222 #define ifa broadaddr ifa dstaddr /* broadcast address interface */ 
223 struct sockaddr *ifa netmask; /* used to determine subnet */ 
224 void (*ifa_rtrequest) (); /* check or clean routes */ 
225 u_short ifa_flags; /* mostly rt_flags for cloning */ 
226 short ifa_refcnt; /* references to this structure */ 
227 int ifa_metric; /* cost for this interface */ 
228 }; 
ifh 
03-15 [O [] ifaddr 
217-219 ifaddr ifa next ifnet{} 
eee »000000 
if_addrlist 
ifnet ifa_ifp 3-16 
ifnet||ifaddr 
































































































































































































































































































































































































































































































































220 ifa addr 
ifa netmask 
| 
ifa_addr r 
1 

0 sockaddr __tfaddrt} 
(3.50 X 0 3-38 
IP IP! 
221-223 ifa_dstaddr( 
ifa_broadaddr) 















































































































































































































































































































































































































































































































































( ) ifnet 
IFF BROADCAST[|| IFF POINTOPOINT D 3-16 DD ifnet H ifaddr 
(U 3-7) 
224-228 ifa rtrequest||ifa flags|]ifa metric 
ifa refcnt ifaddr IFAFREE 0 
SIOCDIFADDRioctl ifaddr 
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TCP/IP 2 
ifaddr IFAFREE 1 
IFAFREE ifafree 
3.5 sockaddr[| |] 
Net/3 sockaddr 
3-17 BSD — osockaddr 3-18 
t. 
120 struct sockaddr ( ioc 
121 u_char sa len; /* total length */ 
122 u char sa family; /*. address family (Figure 3.19) */ 
123 char sa data[14]; /* actually longer; address value */ 
124 ); 
271 struct osockaddr ( 
272 u short sa, family; /* address family (Figure 3.19) */ 
273 char sa data[14]; /* up to 14 bytes of direct address */ 
274 ); 
socket.h 
03-17 [][] sockaddr [| osockaddr 
family 
sockaddr() Be | 
1 1 140 0 
2 140 0 
[] 3-18 [] [| sockaddr [| osockaddr( 00000 sa) 
sa 
1. Sockaddr 
120-124 Net/3 sockaddr 
sa len (OSI[] Unix sa family 
3-19 (address family) 
AF UNSPEC sockaddr 
sa len sa family sockaddr 
sa data sa data 14 
sockaddr sa data 253 sa len 



















































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































sa len . 
Sa family O U 
sa family 256 
AF INET Internet 
C | AF_ISO,AF_OSI OSI 
AF_UNIX Unix 
AF_ROUTE 000 
sockaddr AF_LINK 0000 
sa len|| sa family er 000) 
sa_data sa_data 0 3-19 sa family D 0 
| | 6 
Internet[] [] Sockaddr in | IP 
2. Osockaddr 
271-274 osockaddr[] 4.3BSD Reno sockaddr 
OSI 
OSI Net/3[] sockaddr 
osockaddr 
3.6 ifnet[ ifaddr[] [OD 
ifnet|| ifaddr|| | 
ifnet|| ifaddr 
ifnet|| ifaddr 
ifnet 
( ) 3-20 ifnet 
le softc[0]: 
ifnet() 
arpcom() 
0o00 le_softc() 
sl softc[0]: 
SLIP ifneti) | -1 aotret) 
loif: 
DO ifnet() 


03-20 [00000000 ifrt 00000 





60 TCP/IP 2 
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ifnet 
ifnet 
3-20 SLIP 
softc 0 
U D DD D 
arpcom([] 3-26) 
(ARP) 
le softc([] 3-25) LANCE 
|. Internet[] [] 
ifaddr 
in ifaddr[[ (6.50 0 Ü OSI stadar) - 
iso ifaddr osig [] | 
iso_ifadärt} 
ifaddr 03-21 0 DDD 0 DD 0 DD Internet] (] 
sockaddr_dl ( OSI J JJ RJ p D UJ DJ EJ 
) sockaddr_dl OSI[] ARP 
3-21 Internet OSI 3.11 
(ifaddr sockaddr 1d ) 
3.7 UU UU BL D U 
SLIP 
pdevinit pdevinit ([] 3-22) 
struct pdevinit pdevinit[] = ( 
{ slattach, 1 ), 
( loopattach, 1 ), 
{0,0} 
Y; 
ER device.h 
120 struct pdevinit ( 
121 void (*pdev attach) (int); /* attach function */ 
122 int pdev. count; /* number of devices */ 
123 ); 
device.h 
[] 3-22 [] [| pdevinit 
120-123 SLIP pdevinit pdev attach 
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slattach|| loopattach attach pdev_count 
SLIP 
SLIP 
main 3-23 
- init main.c 
70 main(framep) 
71 void *framep; 
72 4 
96 cpu_startup(); /* locate and initialize devices */ 
` 
172 /* Attach pseudo-devices. (e.g., SLIP and loopback interfaces) */ 
173 for (pdev = pdevinit; pdev->pdev_attach != NULL; pdev++) 
174 (*pdev->pdev attach) (pdev->pdev count): 
175 /* 
176 * Initialize protocols. Block reception of incoming packets 
177 * until everything is ready. 
178 */ 
179 S - splimp(); 
180 ifinit(); /* initialize network interfaces */ 
181 domaininit(); /* initialize protocol domains */ 
182 splx(s); 
231 /* The scheduler is an infinite loop. */ 
232 scheduler (); 
233 /* NOTREACHED */ 
234 } = š 
init_main.c 
O 3-23 main] pago 
70-96 cpu_startup 
97-174 pdevinit pdev_attach 
175-234 ifinit|| domaininit scheduler 
ifinit[] domaininit 7 
SLIP 
38 O00000 
cpu_startup 
3-24 
3 
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TCP/IP 2 
U U (0000 
ifnet if attach LANCED 00 —— 
3-25 le softc SLIP slattach 
ifnet ( 3-20) UU loopattach 
l. le_softc 0324 JI0000000 
69-95 if le.c le softc ( 

NLE ) sc ac arpcom 

sc ifl| sc addr ifnet 
arpcom(sc ac) 3-26 
if_le.c 


69 struct le softc { 
70 struct arpcom sc_ac; 
71 #define sc_if sc ac.ac if 


/* common Ethernet structures */ 
/* network-visible interface */ 


72 #define sc addr sc ac.ac enaddr /* hardware Ethernet address */ 



























































































































































































































































95 ) le softc[NLE]; 





03-25 [| [| le softe 





95 struct arpcom ( 













































































if le.c 


if ether.h 
























































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































96 struct ifnet ac if; /* network-visible interface */ 
97 u char ac, enaddr[6]; /* ethernet hardware address */ 
98 Struct in addr ac ipaddr; /* copy of ip address - XXX  */ 
99 struct ether multi *ac multiaddrs; /* list of ether multicast addrs */ 
100 int ac multicnt; /* length of ac multiaddrs list */ 
101 }; EG 
if ether.h 
03-26 [| O arpcom 
2. arpcom 
95-101 arpcom ac_if ifnet 3-20 ac_enaddr 
cpu_startup LANCE 
leattach[]([] 3-27)[] ac ipadd 
IP 6.6 
IP 6.3[] ac multiaddrs ether multi 
ac multicnt 12 
3-27 LANCE 
106-115 LANCE leattach 
hp_device HP 
HP 
le ifnet (U 3201] ifp sc_if 
ifnet 3-27 
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if le.c 


106 leattach (hd) 
107 struct hp device *hd; 





























































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































108 { 
109 struct lereg0 *ler0; 
110 struct lereg2 *ler2; 
111 struct lereg2 *lemem = 0; f 
112 struct le softc fle = &le softc[hd->hp unit]; 
113 struct ifnet *ifp = &le->sc_if; 
114 char *op; 
115 int i; 
126 #* 
127 .* Read the ethernet address off the board, one nibble at a time. 
128 */ 
129 cp = (char *) (lestd[3] + (int) hd->hp addr); 
130 for (i = 0; i < sizeof(le->sc_addr); i++) { 
131 le->sc_addr[i] = (*++cp & OxF) << 4; 
132 Cp++; 
133 le->sc_addr[i] [= *++cp & OxF; 
134 Cp++; 
135 } 
136 printf("le%d: hardware address %s\n", hd->hp unit, 
137 ether sprintf(le-»sc addr)); 
: a hes : TUR o — 
150 ifp->if unit = hd->hp unit; 
151 ifp->if name = "le"; 
152 ifp->if mtu - ETHERMTU; 
153 ifp->if init - leinit; 
154 ifp->if_reset = lereset; 
155 ifp-»if ioctl = leioctl; 
156 ifp->if output = ether output; 
157 ifp->if_start = lestart; 
158 ifp->if_flags = IFF_BROADCAST | IFF_SIMPLEX | IFF_MULTICAST; 
159 bpfattach(&ifp->if bpf, ifp, DLT EN10MB, sizeof (struct ether_header)); 
160 if attach(ifp); . 
161 return (1); 
162 } S 
if le.c 
[] 3-27 00 leattach 
3. 
126-137 LANCE (4 bit) 
sc addr([] sc_ac.ac_enaddr— 3-26) 
lestd hp_addr hp_addr 
LANCE 
printf 
4. ifnet 
150-157 leattach[| hp device if unit 












































64 



















































































China-pubıtom 











































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































TCP/IP 
if name[]" le” [] if mtu[] 1500 (ETHERMTU) 
if init|] if reset[| if ioctl[|if outputl| it start 
4.1 
158 IFF BROADCAST[] LANCE 
IFF SIMPLE IFF MULTICAST 
159-162 bpfattach BPF 31-8 if attach 
ifnet (3.11[] ) 
39 SLIPD DO 
SLIP cpu startup main 
SLIP[] pdevinit pdev attach[][] slattach SLIP 
SLIP 3-28 sl_softc 
if_slvar.h 





43 struct sl softc { 


















































































































































































































































































































































































































































































































































































































































































































































































































































































































































44 struct ifnet sc if: /* network-visible interface */ 
45 struct ifqueue sc fasta; /* interactive output queue */ 
46 struct tty *sc ttyp; /* pointer to tty structure */ 
47 u char *sc mp; /* pointer to next available buf char */ 
48 u char *sc ep; /* pointer to last available buf char */ 
49 u char *sc buf; /* input buffer */ 
50 u int sc flags; /* Figure 3.29 */ 
51 u int Sc escape; /* =1 if last char input was FRAME ESCAPE */ 
52 struct slcompress sc comp; /* tcp compression data */ 
53 caddr t sc bpf; /* BPF data */ 
54 ); : 
if. slvar.h 
H 3-28 [O O sl softe 
43-54 sl_softc ifnet 
ifnet SLIP sc fastg 
sc ttyp sc_buf[] sc ep SLIP 
sc mp 
SLIP 4 3-29 
[] [] sc_softc{] l U U 

SC_COMPRESS sc_if.if_flags IFF LINKOO [| 0 TCPO O 

SC_NOICMP sc_if.if_flags IFF LINK1[] [| 0) ICMPT] O 

SC_AUTOCOMP sc_if.if_flags IFF LINK20 70 TCP] OOO 

SC ERROR sc flags 000000000090 

3-29 SLIP[] if flags [] sc flags |] 
SLIP[] ifnet 3 
sl softc 

sc escape IP (5.30) TCP (29.13 


























































































































































































































sc_comp 























































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































sc_bpf SLIP BPF 
sl softc[] slattach 3-30| 
135-152 leattach slattach 
slattach SLIP cpu, startup 
main pdev attach SLIP 
if mtu[] 296 (SLMTU) 20 IP 20 TCP 256 
(5.3 ) 
135 void if sl.c 
136 slattach() 
137 ( 
138 struct sl softc *sc; 
139 int i = O; 
140 for (sc = sl_softc; i < NSL; sc++) { 
141 sc->sc_if.if_name = "sl"; 
142 sc->sc_if.if_next = NULL; 
143 sc->sc_if.if_unit = i++; 
144 sc->sc_if.if_mtu = SLMTU; 
145 sc->sc_if.if_flags = 
146 IFF_POINTOPOINT | SC_AUTOCOMP | IFF_MULTICAST; 
147 sc->sc_if.if_type = IFT_SLIP; 
148 sc->sc_if.if_ioctl = slioctl; 
149 sc->sc_if.if_output = sloutput; 
150 sc->sc_if.if_snd.ifq_maxlen = 50; 
151 sc->sc_fastq.ifq_maxlen = 32; 
152 if attach(&sc->sc if); 
153 bpfattach(&sc->sc bpf, &sc->sc if, DLT SLIP, SLIP HDRLEN); 
154 ) 
155 } å 
if sl.c 
[] 3-30 [][] slattach 
SLIP slattachl] if flags 
IFF POINTOPOINT|| SC AUTOCOMP[| IFF MULTICAST 
SLIP| if snd 50 sc fastq 
32 3-42 if snd 50(ifqmaxlen) 
ifinit( 
3-42) 
if attach ifnet slattach[| sc if 
if attachl|sc if sl softcl|]ifnet 
slattach ( /etc/netstart) 
ioctl (5.3l] ) SLIP 
153-155 SLIP slattach bpfattach BPF 

















































































































310 00000 
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eca 



























































































































































































































































































































































































































































































































































































































































































































































































































































main pdevinit pdev_attach 
loopattach 3-31 loopattach 
if_loop.c 
41 void if_loop 
42 loopattach (n) 
43 int n; 
44 ( 
45 struct ifnet *ifp - &loif; 
46 ifp->if name = "lo"; 
47 ifp->if mtu = LOMTU; 
48 ifp-»if flags = IFF_LOOPBACK | IFF MULTICAST; 
49 ifp->if_ioctl = loioctl; 
50 ifp->if_output = looutput; 
51 ifp->if type = IFT_LOOP; 
52 ifp->if hdrlen - 0; 
53 ifp->if addrlen - 0; 
54 if attach(ifp); 
55 bpfattach(&ifp->if bpf, ifp, DLT NULL, sizeof(u int)); 
56 š 
i if loop.c 
NA HEDE BU 
41-56 if mtu 1536 (LOMTU) if flags IFF_LOOPBACK 
IFF_MULTICAST if hdrlen[| if addrlen 
O[] if attach ifnet bpfattach BPF 
MTU 1576(40 + 3X 512) TCP/IP Solaris 2.3 
MTU 8232(40 4 8X 1024) Internet 
40 







































































3.11 if_attach|] |] 


























































































































































































































































































































if_attach ifnet 
if attach 
3-32 if attach 
ifnet: le softc[0]: sl softc[0]: loif: 











ifnet() ifnet() 





ifnet addrs: 


ifaddr{} 


sockaddr dl() sockaddr_d1{} 
sockaddr dl() sockaddr dl() sockaddr_dl() 


[] 3-32 ifnet DI 





































































































































































































































































































































































































































































































































































































3-32 if attach le softc leattach 
sl_softc slattach ifnet 
loopattach ifnet ifnet 
ifaddr ( sockaddr dl 3-33) 
ifnet addrs 
if_dlh 
55 struct sockaddr_dl ( 
56 u_char sdl_len; /* Total length of sockaddr */ 
57 u_char sdl_family; /* AF LINK */ 
58 u short sål index; /* if !- 0, system given index for 
59 interface */ 
60 u_char sdl type; /* interface type (Figure 3.9) */ 
61 u char sdl_nlen; /* interface name length, no trailing 0 
62 read. */ 
63 u char sdl_alen; /* link level address length */ 
64 u char sdl_slen; /* link layer selector length */ 
65 char sdl data[12]; /* minimum work area, can be larger; 
66 contains both if name and 11 address */ 
67 Y; 


68 #define LLADDR(s) ((caddr_t) ((s)->sdl_data + (s)->sdl_nlen)) 


[] 3-33 [] [ sockaddr dl 







































































































































































if dL.h 






























































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































3-20 le softc[0l]l] s1_softcl0] 
IP ifconfig 
(6.6[] ) 
( le0 48 
bit ) ARP[] OSI sockaddr dl 
ifaddr 
(ifa ifwithnet 6-32) 
sockaddr dl 3-33 
55=57 3-18[] sdl len sdl family 
AF LINK 
58  sdl index 3-32 1 SLIP 
2 3 if index 
60 sdl type ifnet if type 
61-68 ifnet if name|| if unit 
SLIP " s10” "owl" 
sdl data sdl nlen ( SLIP 3) 
LLADDR sockaddr dl 
sdl alen 
48 bit sockaddr dl 3-38 








































































































































































































sockaddr dl 
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Net/3 sdl_slen 
if_attach if_index 
ifnet_addrs ifaddr 
if_attach 3-34 5 
59-74 if attach ifp ifnet 
Net/3 ifnet ifnet 
while P 

ifnet ifnet if index||1 ifp 
-»if index 











60 if attach(ifp) 
61 struct ifnet *ifp; 






































































































































































































































































































































































































































62 { 
63 unsigned socksize, ifasize; 
64 int namelen, unitlen, masklen, ether output(); 
65 char workbuf[12], *unitname; 
66 struct ifnet **p = &ifnet; /* head of interface list */ 
67 struct sockaddr dl *sdl; 
68 struct ifaddr *ifa; 
69 static int if indexlim - 8; /* size of ifnet addrs array */ 
70 extern void link rtrequest(); 
71 while (*p) /* find end of interface list */ 
72 p = &((*p)-»if next); 
73 *p - ifp; 
74 ifp->if_index = ++if_index; /* assign next index */ 
75 /* resize ifnet_addrs array if necessary */ 
76 if (ifnet_addrs == || if index >= if_indexlim) { 
77 unsigned n = (if_indexlim <<= 1) * sizeof(ifa); 
78 struct ifaddr **q = (struct ifaddr **) 
79 malloc(n, M_IFADDR, M WAITOK); 
80 if (ifnet addrs) ( 
81 bcopy((caddr t) ifnet_addrs, (caddr t) q, n / 2); 
82 free((caddr t) ifnet addrs, M IFADDR); 
83 } 
84 ifnet_addrs = g; 
85 } 
oe fr 
U 3-34 QQ if attach 0900000090 
1. ifnet addrs 
75-85 if attach ifnet addrs 16(16=8<<1) 
if indexlim[| if attach if indexlim <<= 
3-34 malloc[] free € 




































































































































































































































































































































































malloc 











M WAITOK 





































































































































































































M DONTWAIT 

































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































if attach 3-35 
; " ; if.c 
86 /* create a Link Level name for this device */ 
87 unitname = sprint d((u int) ifp->if_unit, workbuf, sizeof (workbuf)); 
88 namelen = strlen(ifp->if name); 
89 unitlen = strlen(unitname); 
90 /* compute size of sockaddr_dl structure for this device */ 
91 #define _offsetof(t, m) ((int)((caddr t)&((t *)0)->m)) 
92 masklen = _offsetof (struct sockaddr dl, sdi data[0]) + 
93 unitlen + namelen; 
94 socksize = masklen + ifp->if_addrlen; 
95 #define ROUNDUP(a) (1 + (((a) - 1) | (sizeof(long) - 1))) 
96 socksize = ROUNDUP (socksize); 
97 if (socksize < sizeof(*sdl)) 
98 socksize = sizeof(*sdl); 
99 ifasize = sizeof(*ifa) + 2 * socksize; : 
if.c 
03-35 if attan [JD BD D T D D D D D 
2. 
86-99 if attach||if unit||if name sprint d|] if unit 
workbuf masklen|| sockaddr dl sdl data 
(namelen + unit DH socksize na 
socksize|l| masklen ifaddr{} 
(if_addrlen) (ROUNDUP) —< 
sockaddr_d1 
ockaddr_d1 ifasize ifaddr 
socksize 
sockaddr_d1 
if_attach [] 3-36 
3-36 i 
3-36 ifaddr sockaddr dl 
C 
3-36 in ifaddr ifaddr 
sockaddr sockaddr dl 
3-37 
3. 
100-116 bzero O sal ifnet[] JJ 
sockaddr dl 
sdl len sockaddr dl sdl family AF LINK 
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if_namell unitname sdl_data 
sdl_nlen sdl_index sdl_type 
ifnet_addrs ifa ifpl| ifa_addrlist 
ifnet sockaddr_dl|| ifa addr ifnet 
arp rtrequest link rtrequest 
loop rtrequest 19 21 ifa rtrequest[] arp rtrequest 



























































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































linkrtrequest[| loop rtrequest 
Sockaddr dl 
: E Ze 
100 if (ifa = (struct ifaddr *) malloc(ifasize, M IFADDR, M WAITOK)) { 
101 bzero((caddr t) ifa, ifasize); 
102 /* First: initialize the sockaddr_dl address */ 
103 sdl = (struct sockaddr_dl +) (ifa + 1); 
104 sdl->sdl_len = socksize; 
105 sdl->sdl family = AF LINK; 
106 bcopy (ifp->if name, sdl-»sdl data, namelen); 
107 bcopy (unitname, namelen + (caddr t) sdl->sdl data, unitlen); 
108 sdl->sdl nlen = (namelen += unitlen); 
109 sdl->sdl index = ifp->if index; 
110 sdl->sdl type = ifp->if type; 
111 ifnet addrs[if index - 1] = ifa; 
112 ifa->ifa_ifp = ifp; 
113 ifa->ifa_next = ifp->if_addrlist; 
114 ifa->ifa_rtrequest = link_rtrequest; 
115 ifp->if addrlist = ifa; 
116 ifa->ifa_addr = (struct sockaddr +) säl; - 
117 /* Second: initialize the sockaddr dl mask */ 
118 sdl = (struct sockaddr dl *) (socksize + (caddr t) sdl); 
119 ifa->ifa netmask = (struct sockaddr +) sdl; 
120 sdl->sdl len = masklen; 
121 while (namelen != 0) 
122 sdl->sdl data[--namelen] = Oxff; 
123 H 4 
if.c 
0 3-37 DD ifattah DO 0000000000 
4. 
117-123 sockaddr_dl 
ifa netmask ifaddr ( 
JU while 1 
3-38 Sockaddr dl 
if namef] “ le"[]if unit[]O[] if index[] 1 
3-38 ether ifattach (U 3-41) 
3-39 if attach 
if attach ether ifattach 3-40 
124-127 ether_ifattach ( leattach) 
if_attach sockaddr_dl 
XXX 
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family slen 






































sockaddr dl() |lenjar -| index 00000 
(ifa ifaddr) | 20 vz 1 0x6/3|6l|olllelo 


1 1 2 1 1 1 1 nlen alen 3 bytes 
Son (600) i 
sockaddr dl() [len q 
(ifa_netmask) | 11 ff | f£) ff 


900 
je data{] —— 
masklen 
: nog 


03-38 00000000 sockaddr di OO (0D D D D. sdı_) 


ifnet: le_softc{} 
if_addrlist 





ifnet_addrs: 


ifaddr{} 
o — g 
1 |] 
2 _ | 


i£_indexlin | 


0 3-39 00000 if_attach [| [| ifnet [] sockaddr_dl DU 


if.c 
124 /* XXX -- Temporary fix before changing 10 ethernet drivers */ if 
125 if (ifp->if_output == ether output) 

126 ether ifattach(ifp); 

127 ) . 
ifc 





03-40 DO i£attach D 00000 


E LT MM jfethersubr.c 
338 void 


339 ether ifattach(ifp) 
340 struct ifnet *ifp; 


341 ( 

342 struct ifaddr *ifa; 

343 struct sockaddr dl *sdl; 

344 ifp->if type = IFT ETHER; 

345 ifp->if addrlen = 6; 

346 ifp->if hdrlen = 14; 

347 ifp->if mtu = ETHERMTU; 

348 for (ifa = ifp->if addrlist; ifa; ifa = ifa->ifa next) 
349 if ((sdl = (struct sockaddr dl +) ifa->ifa addr) && 


O 3-41 [| [| ether ifattach 
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350 sdl->sdl family == AF LINK) { 
351 sdl->sdl type = IFT ETHER; 
352 sdl->sdl alen = ifp->if addrlen; 
353 bcopy((caddr t) ((struct arpcom +) ifp)-»ac enaddr, 
354 LLADDR(sdl), ifp->if addrlen); 
355 break; 
356 } 
357 } 
nn if ethersubr.c 
03-41 (0) 
5. ether ifattach 
ether ifattach ifnet 
338-357 if type[| IFT_ETHER 6 
U 14 MTU[] 1500 (ETHERMTU) 
leattach MTU 
4.3 for 
sockaddr_dl 
arpcom 
3.12 ifinit[ [|] 
main ([] 3-23) ifinit 3-42 
if.c 
43 void if. 
44 ifinit() 
45 ( 
46 struct ifnet *ifp; 
47 for (ifp = ifnet; ifp; ifp = ifp->if_next) 
48 if (ifp-»if snd.ifq maxlen == 0) 
49 ifp->if_snd.ifq_maxlen = ifqmaxlen; /* set default length */ 
50 if_slowtimo (0); 
51} š 
if.c 
O 3-42 QQ ifinit 
43-51 for attach 
50 (ifqmaxlen) 
sendto 65 507 45 
if slowtimo 
if timer 0 3-43 if slowtimo 
338-343 if slowtimo arg (7.4[] ) 
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if.c 
338 void if. 
339 if_slowtimo (arg) 
340 void *arg; 
341 { 
342 struct ifnet *ifp; 
343 int s = splimp(); 
344 for (ifp = ifnet; ifp; ifp = ifp->if next) { 
345 if (ifp->if timer == 0 || --ifp->if timer) 
346 continue; 
347 if (ifp->if watchdog) 
348 (*ifp->if watchdog) (ifp->if unit); 
349 ) 
350 splx(s); 
351 timeout (if_slowtimo, (void *) 0, hz / IFNET_SLOWHZ); 
352 } š 
if.c 
03-43 [| [| if slowtimo 
344-352 if slowtimo if timer[] Ü if timer 0 
if_slowtimo[] if_timer|] 1 0 if_watchdog 
if_slowtimo splimp ip_slowtimo 
timeout hz/IFNET_SLOWHZ hz[] 1 
( 100) IFNET SLOWHZ 1 
if slowtimo 
timeout callout [Leffler er al. 1989] 
3.13 IN 
ifnet|| ifaddr 
ifnet ifnet | ifnet 
if addrs 
sockaddr sa_family|| sa_len 















































































































































sockaddr_dl 






























































































































































































































































U U 









































































































































































































































































































































































































































































































































































































































3.1 Uniz netstat 
netstat -i (if name) 
(if mtu) 
3.2 if slowtimo ([] 3-43) splimp[| splx 
| | 
3.3 SLIP 
34 if hdrlen[] if_addrlen slattach 
3.5 SLIP 3-38 


















































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































41 00 
3000 i 0 i i 0 U U U U U [] 
U U U U U U | U U | U U 
toctl 5 SLIP 
1 000[] C ( 
JO Hl 
OM uu E OO Net/3[] [] U [ODO ut 
[] 0 0 OO 4-10 Net/3[] 0 
LANCE 
U ifnet (U 3-6) 70 4-2 
42 
DEC DEUNA[] QJ vax/if/if de.c 
3Com[] [] O00 vax/if/if ec.c 
Excelan EXOS 204[] [] vax/if/if ex.c 
Interlan[] 0000000 vax/if/if il.c 
Interlan NP100 0000000 vax/if/if ix.c 
Digital Q-BUS to NID 0 O vax/if/if qe.c 
CMC ENP-20[] 00000 tahoe/if/if_enp.c 
Excelan EXOS 202 (VME) & 203 (QBUS) tahoe/if/if_ex.c 
ACC VERSAbus DO 0 00 tahoe/if/if_ace.c 
AMD 7990 LANCE [J hp300/dev/if_le.c 
NE20009 0 f] i386/isa/if_ne.c 
Western Digital 80030 I 00 00 i386/isa/if_we.c 
041 Ne/3] OOOOOU00000 
ifnet Oo oO O SLIP O O O O 
if init leinit D d D D ü 
if output ether output slouput looutput 000000000000 
if start lestart D OO UO B 
if done D DDD (00) 
if_ioctl leioctl slioctl lcioctl 00000000 ioeti[ O 
if_reset lereset OOO00000000 
if watchdog OOO0O0000000000 


















































042 OOO00000000 

















































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































UULU if output[] if_ioctl|] JOD if init[]if done 
if reset UDE | UDE U ( leinit [| leioctl 
) if start] |] ether output[][] 
4.2 OOOO 
| ioctl CO D I 
4-3 
O O [] O 
net/if_ether.h 00000 
net/if.h ioctlf 0 H 
net/if_ethersubr.c 000000 
hp300/dev/if_le.c LANCE" 000000 
net/if.c ioctl[l[] 
043 OO000000 
4.2.1 GOOG 
DO 4-4 0 LANCE LU L 
O U U 0 0 0 O O 
arpintrq struct ifqueue ARPIT 0 0 Ü 
clnlintrq struct ifqueue CLNPO OOO 
ipintrq struct ifqueue IP] UU ED Ú 
le_softc struct le_softc[[ LANCE) [I 0 00 
etherbraodcastaddr | u_char[] U DU U 0 D 
044 000000000 
le softc uut 
4.2.2 | 
| ifnet | U 4-50 0 
4-6 [] netstat[] ifnet | | 
1 E if name[] if unit (O OO IFF UP) 
4-6 s10[] s12[] s13 0 
2 if mtu [| ^ Network” [| " Address” 
sockaddr_dl|| sdl data IP 
if ipacketsl|if ierrorsl|if opackets|| 
if oerrors[| if_collisions|]| 
s [1 E] E] [] 3% (942 798 / 23 234 729 = 3%) 
° SLIP SLIP 
. LANCE 12 






























































































































































































































































76 TCP/IP 20 | Chinaspub.tom 
aaa 
















































































TU ] d OD SNMP 
if collisions 0 CSMA[I 0 0 DD 0 
if ibytes OOOOO0000 g 
if_ierrors D 0 D DDD DDD D 0 0 ° 
if_imcasts O0O0000000 s 
if_ipackets OO0OO0000000 s 
if_iqdrops O0O0000000000 ° 
if_lastchange O0O00000000 ° 
if_noproto OO0OO00000000 * 
if obytes OOOOOO0 * 
if oerrors OOOO0000 ° 
if_omcasts U D D DDD 0 D ° 
if_opackets 0000000000 S 
if snd.ifq drops | 00000000000 ° 
if snd.ifg len 0000000090 

045 DD mer UDUUUDUU 











netstat -i output 
x—————_—>—— _ — _ ___—_——_—__________——— 


Network Address Ipkts Ierrs Opkts Oerrs Coll 
leo 1500 <Link>8.0.9.13.d.33 28680519 814 29234729 12 942798 



















leo 1500 128.32.33 128.32.33.5 28680519 814 29234729 12 942798 

296 <Link> 54036 0 45402 0 0 
296 128.32.33 128.32.33.5 54036 0 45402 0 0 
296 <Link> 40397 0 33544 0 0 
296 128.32.33 128.32.33.5 40397 0 33544 0 0 
296 <Link> 0 0 0 0 0 
296 <Link> 0 0 0 0 0 
1536 <Link> 493599 0 493599 0 0 

127 127.0.0.1 493599 0 493599 0 0 





046 DO00000 

























































































































































































































































































































































































































































































































































































































































































° 814 
4.2.3 SNMP 
4-7 SNMP (ifTable) (ifEntry) 
ifnet 
ISODE SNMP if_type ifSpeed ifAdminStatus 
ifLastChange | ifnet if lastchange g 
U U U U U ifSpecific 
000000 =<ifíndex> 
SNMP] [] ifnet[] [] O 0 
ifIndex if_index O000000 
ifDescr if name 0000000 
ifType if_type D0000 (000000 sry» 

















047 000 ifrable O00 





Chinaspubscom , 77 






















































































000000 =<ifíndex> 

SNMP) D ifnet[] D Oo D 
ifMtu if mtu OOO MTU ([] D ) 
ifSpeed (000 ) OOOOOOO (0000) 
ifPhysAddress ac enaddr 0000 (0000 arpcom) 
ifAdminStatus 000) OOOO000GrrvrPOD) 
ifOperStatus if flags OOOOOODOGrFr ve[ tu» 
ifLastChange (400 ) D D 0000000 
ifInOctets if_ibytes U D DD DD 
ifInUcastPkts if ipackets -if imcast500000900 
ifInNUcastPkts if imcasts OGOO00000000 
ifInDiscards if igdrops U DD DD DDD DDD DD 0 
ifInErrors if_ierrors U C O D 0 DI 
ifInUnknownProtos | if noproto DU DD D DDD DDD 
ifOutOctets if obytes U D D D 
ifOutUcastPkts if opackets-if omcasts U U 000 D 0 
ifOutNUcastPkts if_omcasts 000000000000 
ifOutDiscards if snd.ifg drops 000000000000 000 
ifOutErrors if oerrors O000000000000 
ifOutQLen if snd.ifq len 000000 
ifSpecific n/a U D DUU DD SNMPD D IDO D D ) 






























































0:47 däi 


43 00000 


Net/3[] 0 LU 


















































L L 0000000000 Unix| OD Hd 









































































































































































































































































































































































































































































































































































































































































































































mo | 009 po] ev Te 
n H ein TT 46-1500] 0 : 400 
10 
2 46-1500[] [] 
048 D.0 r000 E0000 
D 48 bit[] OOOOOODO 16 bit[] LU LU U U U 00 0 U 
00000000 P000000 0x0800(20480 0000000 32 bit] CRC D 
000) 
00000000000000 0 19820 0 Digital] D D D D Intel 00 0 
conan 00000 TCPIPH 0000000000 00000000 IEEE( 
00000000 802.20 802.30 0 O D 0 D TEEED D D 0 [Stallings 198710 






















































































78 TCP/IP 2 China-pubıcom 
A nn ov 
































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































IP RFC 894[Hornig 1984] 802.3 
RFC1042[Postel[] Reynolds 1988] 
48 bit IP ARP (RFC 
826 [Plummer 1982]) 21 IP RARP (RFC 
903 [Finlayson et al. 1984]) 
DECNET DECNET 
4-9 
E if output 
OSI 
00 O23) 
een | e El 


ipintrg: a 


le softc[0]: 


leread 


arpcom{} / ===] 
pon 
MATA 


0000 0000 
00 


049 200022002000 







































































(leintr) 






















































































(ARPO O) 






























































(le softc[0])[] le softc 
4-9 OSI (elnl) IP[] ARP 










































































































































































ether input 





















































clnlintrq 






































































































































OSI (CLNP CLNL) Net/3 
CLNP ISO 8473[] [Stallings 1993] 










































































































































































































































































4-9 































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































ifnet|| arpcom 
LANCE 3-6 ifnet 3-26 
arpcom 
4.3.1 leintr 
leintr 
leintr 
12 ( 
) 
1 tcpdump BPF (BSD ) 
leintr leread 
mbuf ([] m devget) ( 
) leintr lestart 
ether input 
mbuf 
ether input ether header 4-10 
38-42 CRC CRC 
ether type 
if ether.h 
38 struct ether header { 
39 u char ether dhost[6]; /* Ethernet destination address */ 
40 u char ether shost[6]; /* Ethernet source address */ 
41 u short ether type; /* Ethernet frame type */ 
42 Y; i 
if ether.h 
[] 4-10 [ [| ether header 
4.3.2 leread 
leread([] 4-11) leintr 
ether header mbu leread 
BPF 
if le.c 


528 leread(unit, buf, len) 


529 
530 
531 
532 
533 


int unit; 
char *buf; 
int len; 


{ 


struct le softc *le = Sie softc[unit]; 


[] 4-11 


O O 1eread 


80 


534 
535 
536 


537 
538 
539 
540 
541 
542 


543 
544 
545 
546 
547 
548 
549 
550 
551 
552 
553 
554 
555 
556 
557 


558 
559 
560 
561 


562 
563 


564 
565 
566 
567 
568 


569 
570 
571 
572 
573 
574 
575 
576 
577 
578 
579 
580 
581 
582 
583 
584 
585 } 





528-539 





Chinaspub.tom 


TCP/IP 2 









































struct ether_header *et; 
struct mbuf *m; 
int off, resid, flags; 


le->sc if.if ipackets++; i 

et = (struct ether header *) buf; 

et->ether_type = ntohs(fu short) et->ether_type); 

/* adjust input length to account for header and CRC */ 
len = len - sizeof(struct ether header) - 4; 

off = 0; 


if {len <= 0) { 
if (ledebug) 
log (LOG_WARNING, 
"le$d: ierror (runt packet): from Ss: len=%d\n", 
unit, ether sprintf(et->ether shost), len); 
le->sc runt++; 
le->sc if.if ierrors++; 
return; 
) 
flags = 0; 
if (bemp((caddr_t) etherbroadcastaddr, 
(caddr t) et->ether dhost, sizeof (etherbroadcastaddr)) == 0) 
flags |= M BCAST; 
if (et->ether dhost[0] & 1) 
flags |= M MCAST; 


/* 
* Check if there's a bpf filter listening on this interface. 
* If so, hand off the raw packet to enet. 
EJ 
if (le->sc_if.if_bpf) { 
bpf_tap(le->sc_if.if_bpf, buf, len + sizeof(struct ether header)); 


/* 

* Keep the packet if it's a broadcast or has our 
* physical ethernet address (or if we support 

* multicast and it's one). 














*/ 
if ((flags & (M_BCAST | M_MCAST)) == 0 && 
bcmp (et->ether dhost, le->sc_addr, 
sizeof (et->ether_dhost)) !- 0) 
return; 

} 

/* 

* Pull packet off interface. Off is nonzero if packet 

* has trailing header; m devget will then force this header 

* information to be at the front, but we still have to drop 

* the type and length which are at the front of any trailer data. 

*/ 
m = m_devget ((char *) (et + 1), len, off, &le->sc_if, 0); 

if (m == 0) 

return; 
m->m_flags |= flags; 
ether_input (&le->sc_if, et, m); 
if_le.c 
4-11 (0) 
leintr|| leread unit 



















































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































buf len ( CRC) 
et 
ether_header 
540-551 len CRC (runt packet)[] [] 
552=557 
etherbroadcastaddr 
u char etherbroadcastaddr[6] = OZEE; Oxff, Oxff, Oxff, Oxftf, Oxff ); 
C 48 bit 8 bit 
— ANSI C 
bcmp etherbroadcastaddr|| ether dhost M BCAST 
4-12 
0 78 15 16 23 24 3132 39 40 47 
ether dhost U | wer tuns casetas Ecos tuse FT osa s] 
48 bit 0000 
O00000000 
0412 JOO00000000 
12 IP IP 
mbuf M MCAST 
ether input 48 bit 
( 4.1) 
558-573 BPF bpf_tap BPF SLIP 
BPF ( ) 
BPF 
leread 
574-585 m_devget (2.6[] ) leread mbu 
m_devget 
m_devget leread 
mbuf| ether_input 
4.3.3 ether input 
ether input 4-13 ether header 
1. 
196-209 ether_input ifp ifnet 
eh m ( 
) 






































62 





TCP/IP 2 


























Chinaspubecom 










































































































































































































































































ifconfig(8) (6.6[] ) 
































196 
197 
198 
199 
200 
201 
202 
203 
204 
205 


206 
207 
208 
209 
210 


211 
212 
213 
214 
215 
216 
217 
218 


219 
220 
221 
222 
223 


224 
225 
226 
227 


228 
229 
230 
231 
232 


307 


308 
309 
310 
311 
312 
313 
314 
315 





if_ethersubr.c 


eh->ether_dhost, 





































































































































































































































































































void 
ether_input (ifp, eh, m) 
struct ifnet *ifp; 
struct ether header *eh; 
struct mbuf *m; 
{ 
struct ifqueue *ing; 
struct llc *1; 
Struct arpcom *ac - (struct arpcom *) ifp; 
int S; 
if ((ifp-»if flags & IFF UP) -- 0) ( 
m freem(m); 
return; 
} 
ifp->if_lastchange = time; 
ifp->if_ibytes += m->m_pkthdr.len + sizeof (*eh); 
if (bcmp((caddr t) etherbroadcastaddr, (caddr_t) 
sizeof (etherbroadcastaddr)) == 0) 
m->m flags |= M_BCAST; 
else if (eh-»ether dhost[0] & 1) 
m-»m flags |- M MCAST; 
if (m-»m flags & (M BCAST | M MCAST)) 
ifp->if imcasts++; 
switch (eh->ether type) ( 
case ETHERTYPE IP: 
schednetisr(NETISR IP); 
ing = &ipintrg; 
break; 
case ETHERTYPE_ARP: 
Schednetisr(NETISR ARP); 
inq - &arpintrq; 
break; 
default: 
if (eh->ether type > ETHERMTU) { 
m freem(m); 
return; 
} 
} 
s = splimp(); 
if (IF QFULL(inq)) { 
IF DROP (ing); 
m freem(m); 
) else 
IF ENQUEUE (inq, m); 
splx(s); 
} 


[] 4-13 D [] ether input 














if_ethersubr.c 














210-218 
















































































Unix 



































time timeval 
(19700 10 10 00:00:00 [UTC]) 
Ramsey 1993] | 0 UTC Net/3 | | 
struct timeval 


long tv sec; 


long tv usec; 


y; 


























































































































































































































































































































/* seconds */ 


/* and microseconds */ 




















































































































[Itano and 


timeval 

































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































ether_input if_lastchange if_ibytes 
( 14 ) 
ether input leread 
| 0 BPFI] [] L ether input 
2. 
219-227 ether inpu IP schednetisr 
IP IP ipintrg ARP ARP 
arpintrq 
isr 
| U BSD 0 ARP Il | [U arpinput 
BPF Net/3 RARP 
BPF 
228-307 
( H OSI ) 0-1500 IEEE 802.3 length] [] 
802.3[] length 1501-65535 | HDD spe] D D 
2048 IP] O 
802.3 ( 2045 ARPIT [| 
OSI [Stallings 1993] OSI 04-14 0000 op 00 
802.3[] length] [] 
4-14 RFC 
1700 [Reynolds and Postel 1994] 
3.0 
308-315 ether_input 
7-23 21-16 IP[] ARP 50[] (ipqmaxlen) 
ether_input 
schednetisr (1.12[] ) 
U ipintr IP L arpintr ARP 


























84 


4.3.4 ether_output 


TCP/IP 2 
























































China-pubecom 



































IP ifnet 





































































































if outputl|ether output 













































































































































































































































































































































































































































































4-15 





















































E To if ethersubr.c 


49 int 

50 ether output (ifp, m0, dst, rt0) 
51 struct ifnet *ifp; 

52 struct mbuf *m0; 

53 struct sockaddr *dst; 

54 struct rtentry *rt0; 


55 ( 

56 short type; 

57 int s, error 2 0; 

58 u char edst[6]; 

59 struct mbuf *m = m0; 

60 struct rtentry *rt; 

61 struct mbuf *mcopy = (struct mbuf *) 0; 

62 struct ether_header *eh; 

63 int off, len = m->m_pkthdr.len; 

64 struct arpcom *ac = (struct arpcom *) ifp; 

65 if ((ifp->if flags & (IFF UP | IFF RUNNING)) != (IFF UP | IFF RUNNING) ) 
66 senderr (ENETDOWN) ; 

67 ifp->if lastchange = time; 

68 if (rt = rto) { 

69 if ((rt->rt_flags & RTF_UP) == { 

70 if (rt0 = rt = rtalloci(dst, 1)) 

71 rt->rt_refent--; 

72 else 

73 senderr (EHOSTUNREACH) ; 

74 } 

75 if (rt->rt_flags & RTF_GATEWAY) { 

76 if (rt->rt gwroute == 0) 

77 goto lookup; 

78 if (((rt = rt->rt gwroute)->rt flags & RTF UP) == 0) ( 
79 rtfree(rt); 

80 rt = rt0; 

81 lookup: rt-»rt gwroute = rtallocl(rt-»rt gateway, 1); 
82 if ((rt = rt-»rt gwroute) == 0) 

83 senderr (EHOSTUNREACH); 

84 } 

85 } 

86 if (rt->rt_flags & RTF_REJECT) 

87 if (rt-»rt rmx.rmx expire == 0 || 

88 time.tv sec « rt-»rt rmx.rmx expire) 

89 senderr(rt == rt0 ? EHOSTDOWN : EHOSTUNREACH); 
90 } 


I... Bf ethersubr.c 
04-15 [| [ ether output OOO 












































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































49-64 ether output ifp ifnet mo 
dst rto 
65-67 ether_output senderr 
#define senderr (e) error = (e); goto bad;) 
senderr bad ether_ 
output error 
ether_output 
ENETDOWN 
1. 
68-74 rto ip_output ether_output BPF 
ether outputl] rto 4-16 
EHOSTUNREACH 
rtOl|rt 
- - if ethersubr.c 
91 switch (dst->sa family) { 
92 case AF INET: 
93 if (larpresolve(ac, rt, m, dst, edst)) 
94 return (0); /* if not yet resolved */ 
95 /* If broadcasting on a simplex interface, loopback a copy */ 
96 if ((m->m_flags & M_BCAST) && (ifp->if_flags & IFF_SIMPLEX)) 
97 mcopy = m_copy (m, 0, (int) M_COPYALL); 
98 off = m-»m pkthdr.len - m->m len; 
99 type = ETHERTYPE IP; 
100 break; 
101 case AF ISO: 
142 case AF UNSPEC: 
143 eh = (struct ether header *) dst->sa data; 
144 bcopy((caddr t) eh-»ether, dhost, (caddr t) edst, sizeof(edst)); 
145 type - eh-»ether type; 
146 break; 
147 default: 
148 printf("%s%d: can't handle af%din", ifp->if name, ifp->if unit, 
149 dst-»sa, family); 
150 senderr (EAFNOSUPPORT) ; 
151 ) å 
if ethersubr.c 
U 4-16 [| [| ether output [00000 
2, 
75-85 ( ) 
rt EHOSTUNREACH rt 
3: ARP 
86-90 ARP ARP RTF REJECT 

























































































































































































66 
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TCP/IP 2 
21-24 
ether_output 
ether_output IP 
ARP (210) 4-16 ARP 
4. IP 
91-101 ether output sa family 4-16 
case| | AF INET|| AF ISO[| AF UNSPEC case AF I SP 
case AF INET arpresolve TP 
ARP arpresolve 1 ether_output 
IP ARP ARP in_arpinput 
ether_output 
ARP ether_output 
( ) m_copy 
switch 
12 
5. 
142-146 ARP 
AF_UNSPEC dst bcopy edst 
type arpresolve([] AF_INET) 
6. 
147-151 ether_output EAFNOSUPPORT 
4-17 ether_output 
- if ethersubr.c 
152 if (mcopy) 
153 (void) looutput (ifp, mcopy, dst, rt); 
154 FE 
155 * Add local net header. If no space in first mbuf, 
156 * allocate another. 
157 */ 
158 M PREPEND (m, sizeof(struct ether_header), M_DONTWAIT); 
159 if (m == 0) 
160 senderr (ENOBUFS) ; 
161 eh = mtod(m, struct ether header *); 
162 type - htons((u short) type); 
163 bcopy((caddr t) &type, (caddr t) &eh->ether type, 
164 sizeof (eh->ether_type)); 
165 bcopy((caddr t)edst, (caddr t)eh->ether dhost, sizeof (edst)); 
166 bcopy ( (caddr t)ac-»ac enaddr, (caddr t)eh->ether shost, 
167 sizeof (eh->ether_shost)); ; 
if_ethersubr.c 
04-17 00 ether output [10 H H 
7. 
152-167 switch 






































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































looutput looutput[] 5.4 
M PREPEND 14 
mbu M PREPEND 
( 16.7 UDP sosend[] 13.6 igmp sendreport) 
ether output[] typel[] edst[] ac enaddr([] 3-26) 
ac enaddr 
ether header ac enaddr ether header 
mbu 32 bit CRC CRC 
4-18 
if ethersubr.c 

168 S = splimp(); 

169 /* 

170 * Queue message on interface, and start output if interface 

171 * not yet active. 

172 */ 

173 if (IF QFULL(&ifp->if snd)) ( 

174 IF DROP(&ifp-»if snd); 

175 splx(s); 

176 senderr (ENOBUFS) ; 

177 ) 

178 IF_ENQUEUE (&ifp->if_snd, m); 

179 if ((ifp->if_flags & IFF_OACTIVE) == 0) 

180 (*ifp->if start) (ifp); 

181 splx(s); 

182 ifp->if_obytes += len + sizeof(struct ether_header) ; 

183 if (m->m_flags & M_MCAST) 

184 ifp->if_omcasts++; 

185 return (error); 

186 bad: 

187 if (m) 

188 m freem(m); 

189 return (error); 

190 ) ; 

if ethersubr.c 
[]4-18 [| [| ether output 00000 
168-185 ether output ENOBUFS 
if start 
186-190 senderr bad 
4.3.5 lestart 
lestart LANCE 
ether output([] 4-18) 
if start lestart 
lestart 
lestart 






























































































































































































































































359 le->sc_txcnt LETBUF lestart 













































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































LANCE LETBUF 

le->sc_txcnt 

5. 
360-362 lestart|| ifnet IFF_OACTIVE 

[Jacobson 1998a] 
LANCE ( ) 
NFS NFS UDP ( 
8192 ) IP LANCE 
NFS UDP 
Jacobson Sun[] LANCE 

44 ioctif Hn 

ioctl 

ioctl 

int ioctl(int fd, unsigned long com,...); 

fd 
ioctl com = " 

ioctl 
ioctl 
15[] 
17 ioctl | ioctl 
ioctl 
ioctl 4-200 [| 





































































































































































































SIOCGIFCONF struct ifconf f ifconf 0000000 
SIOCGIFFLAGS struct ifreg *| ifioctl 00000 
SIOCGIFMETRIC struct ifreq *| ifioctl 00000 
SIOCSIFFLAGS struct ifreg zl ifioctl 00000 
SIOCSIFMETRIC struct ifreq *| ifioctl 00000 
[] 4-20 [] O iocti [] LH O 
ioctl ( com) 
















































































































































































































































































ioctl 
































































































































































































































90 TCP/IP 2 China-pubtom 
e 100 







































































| 


if ioctl 





0421 000000 iesti UD 


















































































































































































































































































































































































































































































































































































































































































































































































































































































































































4.4.1 ifioctl 
ioctl 4-20 5 4-22 ifioctl 

394-405 SIOCGIFCONF|| ifioctl ifconf ifreq 
406-410 ioctl ifreq ifunit 
ifnet ifr->ifr name ( “s10"0“ lei" 

“ 100") ifioctl ENXIO cmd 

4-29 
447-454 ioctl ifioctl 
IP UDP udp_usrreg 
















































































Chinaspubcon 9] 

























































































6-10 23.10 udp usrreq 











































































































switch 0 























if.c 


394 int 

395 ifioctl(so, cmd, data, p) 
396 struct socket *so; 

397 int cmd; 

398 caddr t data; 

399 struct proc *p; 























































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































400 ( 

401 struct ifnet *ifp; 

402 struct ifreq *ifr; 

403 int error; 

404 if (cmd == SIOCGIFCONF) 

405 return (ifconf (cmd, data)); 

406 ifr = (struct ifreq *) data; 

407 ifp = ifunit (ifr->ifr_name); 

408 if (ifp == 0) 

409 return (ENXIO); 

410 switch (cmd) { 

447 default: 

448 if (so->so_proto == 0) 

449 return (EOPNOTSUPP); 

450 return ((*so->so_proto->pr_usrreg) (so, PRU_CONTROL, 
451 cmd, data, ifp)); 
452 } 

453 return (0); 


04-22 [] [| ifiocti D 0 O O SIOCGIFCONF 





4.42 ifconf 






























































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































ifconf 

ifreql] ifconf 4-23 4-24 
262-279 ifreq ifr name 

ioctl 
292-300 ifconf ifc lenu ifc buf 

ifconf ifreq ifconf 
ifr addr ifreq ifreq 
ifr addr( Sockaddr ) Sockaddr 
sa len 4-25 ifconf 
4-25 

4-26 ifconf 

462-474 ifconf cmd data ifconf 


















































































































































































































































92 muu n: China+pub.tom 
TT 





if.h 
262 struct ifreq ( 
263 #define IFNAMSIZ 16 
264 char ifr name[IFNAMSIZ]: /* if name, e.g. "en0" */ 
265 union { 
266 struct sockaddr ifru addr; 
267 struct sockaddr ifru dstaddr; 
268 struct sockaddr ifru, broadaddr; 
269 short ifru_flags; 
270 int ifru_metric; 
271 caddr_t ifru_data; 
272 y ifr ifru; e 
273 #define ifr addr ifr_ifru.ifru_addr /* address */ 
274 #define ifr_dstaddr ifr_ifru.ifru_dstaddr /* other end of p-to-p link */ 
275 #define ifr_broadaddr ifr ifru.ifru broadaddr /* broadcast address */ 
276 #define ifr flags ifr ifru.ifru flags /* flags */ 
277 #define ifr metric ifr ifru.ifru metric /* metric */ 
278 #define ifr data ifr ifru.ifru data /* for use by interface */ 
279 ); 


O 4-23 QQ ifreq 


————————— 07 


292 struct ifconf ( 


293 int ifc len; /* size of associated buffer */ 
294 union ( 

295 caddr t ifcu buf; 

296 struct ifreq *ifcu req; 

297 ) ifc ifcu; 


298 #define ifc buf ifc ifcu.ifcu buf /* buffer address */ 
299 #define ifc req ifc ifcu.ifcu req /* array of structures returned */ 
300 }; 





if.h 
U 4-24 [| [| ifconf 


ifc 






data (process) 








ifconf() ifconf() 












= [wed [uoemaddr int) | 
[wet  — [aockadāz isot — 
[wet fæockaddr 810) | 





ep 


UD D 


04-25 ifconf 0000 








China-pubecom 93 



























































462 int if.c 
463 ifconf(cmd, data) 

464 int cmd; 

465 caddr t data; 

466 { 

467 struct ifconf *ifc = (struct ifconf *) data; 

468 struct ifnet *ifp = ifnet; 

469 struct ifaddr *ifa; 

470 char *cp, "ep; Y 
471 struct ifreg ifr, *ifrp; i 

472 int space = ifc->ifc len, error = 0; 

473 ifrp = ifc-»ifc req; 

474 ep = ifr.ifr_name + sizeof(ifr.ifr_name) - 2; 

475 for (; space > sizeof(ifr) && ifp; ifp = ifp->if_next) { 

476 strncpy(ifr.ifr name, ifp->if name, sizeof(ifr.ifr name) - 2); 
477 for (cp = ifr.ifr name; cp « ep && *cp; cp++) 

478 continue; 

479 *cp++ = "Dir + ifp->if unit; 

480 *cp = "NO"; 

481 if ((ifa = ifp->if_addrlist) == 0) { 

482 bzero((caddr t) & ifr.ifr_addr, sizeof(ifr.ifr addr)); 
483 error - copyout((caddr t) & ifr, (caddr t) ifrp, 

484 sizeof(ifr)); 

485 if (error) 

486 break; 

487 space -= sizeof(ifr), ifrp++; 

488 ) else 

489 for (; space > sizeof(ifr) && ifa; ifa = ifa->ifa next) ( 
490 struct sockaddr “sa = ifa->ifa addr; 

491 if (sa->sa len <= sizeof(*sa)) { 

492 ifr.ifr addr - *sa; 

493 error - copyout((caddr t) & ifr, (caddr t) ifrp, 
494 sizeof(ifr)); 

495 ifrp++; 

496 ) else ( ` 

497 space -= sa->sa len - sizeof(*sa); 

498 if (space < sizeof(ifr)) 

499 break; 

500 error = copyout((caddr t) & ifr, (caddr t) ifrp, 
501 sizeof(ifr.ifr name)); 

502 if (error == 0) 

503 error = copyout((caddr t) sa, 

504 (caddr t) & ifrp->ifr addr, sa->sa len); 
505 ifrp - (struct ifreq *) 

506 (sa->sa len + (caddr t) & ifrp->ifr addr); 
507 } 

508 if (error) 

509 break; 

510 space -= sizeof(ifr); 

511 } 

512 } 

513 ife->ifc len -= space; 

514 return (error); 


04-26 [| [| ifconf 





























































































































ifc ifconf dat all ifp[] ifnet ( ) 















































94 














































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































TCP/IP 2 
ifa cpll ep ifr ifr 
ifreq ifrq 
space cp 
ep 
475-488 for ifr_name 
ifr_name if_unit 0 
ifreg space ifrp 
489-515 for ifr 
ifr sockaddr A Er 
spacell ifrp 
(ifc->ifc len) ifconf ioctl ifconf 
ifconf 
4.4.3 
4-27 SLIP 
ifnet: le softc[0]: sl softc[0]: loif: 









ifnet() 





Sockaddr dl() 

















4-28 




































































ifc 











struct ifconf ifc; 
char buffer[144]; 


int s; 


buffer 


/* any socket */ 


ifc.ifc len - 144; 


ifc.ifc buf 
if (ioctl(s, 


buffer; 


perror ("ioctl failed"); 
exit (1); 




















SIOCGIFCONF, &ifc) < 0) ( 


ifnet{} 


ifaddr() 


sockaddr_d1{} 


sockaddr dl() 


0427 00000000 



































/* SIOCGIFCONF adjusts this */ 
/* contains interface addresses when ioctl returns */ 





faddr{} 


sockaddr_dl() 


sockaddr dl() 




































SIOCGIFCONF 
















































































































































































4-28 











































































































108 (3x 36) 

















ioctl 














ifc len 











China-bubcom 95 














































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































144 108 sockaddr_dl 36 
16 16 3 
&ifc 
ifconf() 
ifc_len 108 
ifc buf 
ifr name[] ifr addr === sl 
F aep 0 ) (200 Ü ) _ 
1|e|o 2018| 1 |6|s|ejO 1|]e|o| 00000 3600 
s|ılo 018 2 pelaloljolslılo 3600 
1lojo 018! 3 2431/0|0!1|0|0 a 360 Ú 
— — 360 D 
H 4-28 srocGrrcoNr 000000 
ifr addr sockaddr (20 ) 
(18[] AF LINK) sdl index sdl type 
([] IFT ETHER[] IFT SLIP[] IFT LOOP 60) 280 24) 
sa nlen( J)] sa alen( JN sa slen( 
) sa nlen 3 sa alen[] 6 SLIP 
sa alen[] ol sa slen 0 
( JU SLIP 
sockaddr dl 
sockaddr dl ( 4-27 ) 
( IP[] OSI ) 
sockaddr dl 
444 OOO ioctl 
4-20 (SIOCGIFFLAGS[| SIOCGIFMETRIC[| SIOCSIFFLAGS 
SIOCSIFMETRIC) ifioctl 4-29 case 
1. SIOCGIFLAGS[] SIOCGIFMETRIC 
410-416 SIOCGxxx ifioctl if flags[| if metric 
ifreq ifr flags 




























































































































































































ifr metric([] 4-23) 
2. SIOCSIFFLAGS 
417-429 








































































































































































































































































































if_down|| if up 


























3. IFF CANTCHAGE 
430-434 3-7 (ifp->if_flags 









































































































































96 














































































































China+pubitom 
















































































































































































































































































































































































TCP/IP 2 
IFF CANTCHANGE) (ifr-»ifr flags- 
IFF CANTCHANGE) 
ifp-»if flags if ioctl ( 
LANCE leioct1—[] 4-31) 
ifc 
410 switch (cmd) { 
411 case SIOCGIFFLAGS: 
412 ifr->ifr_flags = ifp->if_flags; 
413 break; 
414 case SIOCGIFMETRIC: 
415 ifr->ifr_metric = ifp->if_metric; 
416 break; 
417 case SIOCSIFFLAGS: 
418 if (error = suser(p->p ucred, &p->p_acflag)) 
419 return (error); 
420 if (ifp->if_flags & IFF UP && (ifr->ifr flags & IFF_UP) == 0) 
421 int s = splimp(); 
422 if_down (ifp); 
423 splx(s); 
424 } 
425 if (ifr->ifr_flags & IFF UP && (ifp->if flags & IFF UP) == 0) 
426 int s = splimp(); 
427 if_up(ifp); 
428 splx(s); 
429 } 
430 ifp->if flags = (ifp->if flags & IFF CANTCHANGE) | 
431 (ifr->ifr flags & "IFF CANTCHANGE); 
432 if (ifp->if ioctl) 
433 (void) (*ifp->if ioctl) (ifp, cmd, data); 
434 break; 
435 case SIOCSIFMETRIC: 
436 if (error = suser(p-»p ucred, &p-»p acflag)) 
437 return (error); 
438 ifp->if metric = ifr->ifr metric; 
439 break; å 
if.c 





4. SIOCSIFMETRIC 


04-29 DD ifieci [00000 









































































































































































































































































































































































































































































































































































































































































































































































































































435-439 ifioctl 
if_metric 

4.4.5 if down[] if up 

ifconfig SIOCSIFFLAGS 
IFF UP 4-30 if down[]if up 
292-302 IFF_UP 
pfctlinput(7.7[]) PRC IFDOWN 

OSI IP 

TCP[] UDP 























































































































































































































if gflush rt ifmsg TCP 











































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































UDP 
308-315 IFF_UP rt_ifmsg 
if.c 
292 void if. 
293 if_down(ifp) 
294 struct ifnet *ifp; 
295 ( 
296 struct ifaddr *ifa; 
297 ifp->if_flags &= “IFF_UP; 
298 for (ifa = ifp->if_addrlist; ifa; ifa = ifa->ifa_next) 
299 pfctlinput (PRC_IFDOWN, ifa->ifa addr); 
300 if_qflush(&ifp->if_snd); 
301 rt_ifmsg(ifp); 
302 ) 
308 void 
309 if_up(ifp) 
310 struct ifnet *ifp; 
311 ( 
312 struct ifaddr *ifa; 
313 ifp->if_flags |= IFF UP; 
314 rt ifmsg(ifp); 
315 3 2 
if.c 
04-30 [| [| if down [| if up 
4.4.6 SLIP 
4-29 SIOCSIFFLAGS ifioctl if ioctl 
slioctl[| loioctl ifioctl 
EINVAL 4-31 leioctl[] LANCE SIOCSIFFLAGS 
if le.c 


614 leioctl(ifp, cmd, data) 


615 struct ifnet *ifp; 


616 int 


cmd; 


617 caddr t data; 


618 ( 
619 
620 
621 
622 


623 


switch (cmd) ( 





struct ifaddr *ifa = (struct ifaddr *) data; 
struct le softc fle = &le softc[ifp-»if unit]; 
struct leregl *lerl le->sc_rl; 

int s = splimp(), error = 0; 


































































































































































































































































































AE A 


case SIOCSIFFLAGS: 


O 4-31 D [] 1eiocti [| SIOCSIFFLAGS 


98 


639 
640 
641 
642 
643 
644 
645 
646 
647 
648 
649 
650 
651 
652 
653 
654 
655 
656 








TCP/IP 2 


China-pubecom 












































if ((ifp->if_flags & IFF_UP) == 0 && 
ifp->if_flags & IFF_RUNNING) { 
LERDWR(le->sc_r0, LE STOP, lerl->lerl rdp); 
ifp->if_flags &= ~IFF_RUNNING; 
} else if (ifp->if_flags & IFF_UP && 
(ifp->if_flags & IFF_RUNNING) == 0) 
leinit(ifp-»if unit); 
/* 
* If the state of the promiscuous bit changes, the interface 
* must be reset to effect the change. 
*/ 
if (((ifp->if flags ^ le-»sc iflags) & IFF PROMISC) && 
(ifp->if flags & IFF RUNNING)) { 
le->sc iflags = ifp->if flags; 
lereset(ifp-»if unit); 
lestart (ifp); 


break; 










































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































672 default: 
673 error - EINVAL; 
674 H 
675 splx(s); 
676 return (error); 
677 } x 
if_le.c 
14-31 (0) 
614-623 leioctl data ifaddr ifa 
le ifp-»if unit[| le softc cmd|| switch 
638-656 4-31 case SIOCSIFFLAGS ifioctl leioctl 
( 
IFF_UP) 
IFF PROMISC IFF PROMISC 
672-677 default EINVAL 
45 DD 
LANCE 
802.3 21 IP 
( ) 
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41 [| leread 000000 Ul 1000000000 M_McAST(Ü [| M. BCAST 
UD O ether. input[] 0 O OD leread[] ether. input 0000 
000000000000 U 

42 [| ether input (0 4130 O U 000000000000 00000000 

|DOOOOOOODif0000000 eilsel | U 







































































































































































































































































































































































































































































































































































































































































































































































210 LE 
HOU 400000 i L Dui 000000 
ioctl] J Hog Ul TCP O 2913000000 
4-2 5-1 
ifnet 000 [] O 0 D 
if init leinit D D 00 D 
if output ether output looutput 000000000000 
if_start lestart D D D D D 
if done D DDD do) 
if_ioctl leioctl loioctl OOOOOODO :oct1[] 0 
if_reset lereset D DD DDD DDD 000 0 
if watchdog D D DD 0000000000 
05-1 OOOO00000000 
5.2 ODDO 
SLP D D 0 000001 U 
U U 
net/if sl SLIPO O 
net/if sl. SP 00000 
net/if loop.c 000000 
052 JOOO0000 
5.2.1 o 
Ll SLIP| 5-3 


























































































































t sl softc I] 































































































loif t ifnet 
O000000000 
sl_softel Ü ui | SLIP OD O 1oif OD U 
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ifnet SLIP 
et ) 5-4 
O O [] O O 
tk_nin DU D D D DDD O SLP D D D D D 10 0 DDD 0 
O 5-4 00 tk nin 
5.3 SLIPO O 
| SLIP 
IP SLIP 
SLIP 
LIP END 0xc0 END IP 
Oxdb Oxdc 
ESC Oxdb 































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































05-5 0 D D OOOO Ser 
RFC 1055 [Romkey 1988] SLIP 
SLIP 
(PPP) SLIP 
PPP[] RFC 1332 [McGregor 199211) RFC 1548 [Simpson 
| PPP| 
B PPP 
| SLIPDISC 
SLIP 
TTY( JU Net/3 TTY (Line disci 
1/0 (U read 
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L L | | U L 0 SLIP U U U TTY 
L LU LU L 
SLIP IP o SLIP[] ifnet 
if_output [] HI SES 
SLIPDISC 
5-6 | SLIP slattach 
o SLIP TTYO 0 0 
Ut SLIP DODODO! 0 TTYI] OO [] [Leffler et al. 
198910 O 5-70 U SLIP[] [| U L L LU 
(U) 
AAA Een AAA 
Ë! U HEE IF MEAN 
=== 7] E 
ipintrq: | 
000 
U 5-6 SLIP[] 0 0 0 D 0000 0 
O O 0000/0000 [] O 
slattach ° HOO sl softe] 00000000 ifnetO D 
slinit . O D O SEP D D D 
sloutput ° OOOTTYOOOOOOOODOOOOOOO 
slioctl . D DDD ioctif 0 
sl btom . OOOOO00000000 mufl D 
slopen . 0 si softe] 0 000 TTYDOOOOOOOOOO 
slclose . O D TTYO DD si soft DD D D D 0 0 D 00 DD 0 DD 00 D 0 
sltioctl . NO TTY iocti] Ü 
slstart . . O0O00000000007YOOO00000 
slinput ° ° OOOTTYDOOOOOOOOOODOOOOOOOOOODOOOO 
057 SLIP[] H] [1 H] D] C0 D] D. Hl 
Net/3[] [] SLIP OO TCP[] LU L U 1) uti 29.13 
IU | | U 570 UU u 















































































































































Net/3 SLIP SLIP 













































































































































































UT Co 050 gnunsuenn 103 


OOO000000000000000000000000000000000 
058000000000000sSerP| JO OO00000sSere D D 0000 


sl softc[0]: f y 


E O EE a ra | 


et 



















0000 D 0000 
05-8 SLPI 00000 


[] Net/30 [] sc ttyp I t_sc[] U ttyO 00 sl softe[010 0000000 
OO0O00000000000000000000000000000000000 


0058300000000 

e00 si soft 000000000 ttyl 00O TTYO D Ú 
«DOOOOOOOOGOOOOODOOOOOOOSEPIOOODOOODO PO 
OO slinputl] [| ipintral] |] 

*OO000 if and sc fasta 00000 SLIPO I O O sistart[] D TTYO DO 
TYO0 000000000 elist 00 toproc 000000 clistd 0000 
U U 


5.3.2 SLIPO [| 0 [] slopen[] slinit 


000370000 slattach 00000 s1_softed 0000000000000 
po00000000000(000 siattachO 000 TTYD 0 (000 /dev/ttyo1g U 
0000 ioe:10 00 See o 00000000000000000 TTY0 000000 
0000000 000 siopen)Q 00000000 TrY0000000SLP000000 
OD slopen O00 5-900 


1 04 TCP/IP 2 
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if sl.c 
181 int LÆ 
182 slopen(dev, tp) 
183 dev t dev; 
184 struct tty *tp; 
185 { 
186 struct proc *p = curproc; /* XXX */ 
187 struct sl softc *sc; $ 
188 int nsl; 
189 int error; 
190 if (error = suser (p->p_ucred, &p-»p acflag)) 
191 return (error); 
192 if (tp->t_line == SLIPDISC) 
193 return (0); 
194 for (nsl = NSL, sc = sl_softc; --nsl >= 0; sc++) 
195 if (sc->sc ttyp == NULL) { 
196 if (slinit(sc) == 0) 
197 return (ENOBUFS); 
198 tp->t_sc = (caddr_t) sc; 
199 sc->sc_ttyp = tp; 
200 sc->sc_if.if_baudrate = tp->t_ospeed; 
201 ttyflush(tp, FREAD | FWRITE); 
202 return (0); 
203 } 
204 return (ENXIO); 
205 } i 
if sl.c 
0 5-9 [] O slopen 
181-193 slopen dev slopen 
tp TTY tty 
TTY SLIPDISC slopen 
194-205 for sl_softc slinit (5.10 
t sel] sc ttyp ttyl] sl_softc TTY (t ospeed) 
SLIP ttyflush TTY SLIP 
slopen ENXIO 0 
sl_softc TTY SLIP 
TTY SLIP slattach 
TTY 
5-10 slinit sl_softc 
156-175 slinit mbuf sl_softc 
SLIP sc_buf 
sc_mp sc_ep 
sl_compress_init TCP (29.13[] ) 
5-8 sc buf slinit 148 
(BUFOFFSET) 
sc mp 
sc ep 5-11 SLIP 
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IP 
6.6 
156 static int if slc 
157 slinit(sc) 
158 struct sl softc *sc; 
159 ( 
160 caddr t p; 
161 if (sc-»sc ep == (u_char +) 0) { 
162 MCLALLOC(p, M WAIT); 
163 if (p) 
164 Sc-»-sc ep = (u_char zi p + SLBUFSIZE; 
165 else ( 
166 printf("sl%d: can't allocate buffer\n", sc - sl, softc); 
167 sc->sc if.if flags &= ^IFF UP; 
168 return (0); 
169 } 
170 } 
171 sc->sc_buf = sc->sc_ep - SLMAX; 
172 SC->SC_mp = sc->sc buf; 
173 sl_compress_init (&sc->sc_comp) ; 
174 return (1); 


175 } A 
——  n[ — — ip slc 


05-10 [] [] slinit 








0 U U o 0 
MCLBYTES 2048 [] O mbuff JOD 
SLBUFSIZE 2048 000000 SLIP 000000—0 000 BPE [] 
SLIP HDRLEN 16 SLIP BPFO OOOO 
BUFOFFSET 148 00000 TCPIP 0000000000 BPF00000 
SLMAX 1900 HUUDUDUDUDBDBDUHBSLIPHUDDUDD 
SLMTU 296 scPII00000000000000000000000000 














SLIP HIWAT 100 0 TTYIOOOOOOOOOOOO 











BUFOFFSET+SLMAX=SLBUFSIZE=MCLBYTES 





05-11 SLIPO P 




























































































































































































































































































































































































































































































































































































































































































































































































































































































































































































5.3.3 SLIP slinput 
TTY slinput SLIP 5-12 
slinput 
527-545 slinput e tp tty 
Ul [| tk. nin TTY U slinput[| tp->t_sc|] scl] sc 
sl softc | TTY| slinput 
slinput c TTY 
c 
SC ERROR slinput slinput END 
CLOCAL ( 
) 
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China-bubıcon 


TCP/IP 2 





















































: if sl.c 
527 void 
528 slinput(c, tp) 
529 int cr 
530 struct tty *tp; 
531 { 
532 struct sl softc *sc; 
533 struct mbuf *m; 
534 int len; 
535 int S; 
536 u_char chdr[CHDR LEN]; 
537 tk nin**; 
538 SC = (struct sl softc *) tp->t sc; 
539 if (sc == NULL) 
540 return; 
541 if (c & TTY ERRORMASK || ((tp->t state & TS CARR ON) == 0 && 
542 (tp->t_cflag & CLOCAL) == 0)) L 
543 sc->sc flags |= SC ERROR; 
544 return; 
545 } 
546 C &- TTY CHARMASK; 
547 ++sc->sc_if.if_ibytes; 
548 switch (c) { 
549 case TRANS_FRAME_ESCAPE: 
550 if (sc->sc escape) 
551 c = FRAME ESCAPE; 
552 break; 
553 case TRANS FRAME END: 
554 if (sc->sc escape) 
555 c = FRAME END; 
556 break; 
557 case FRAME ESCAPE: 
558 SC->sc escape = 1; 
559 return; 
560 case FRAME_END: 
636 } 
637 if (sc->sc_mp < sc->sc_ep) { 
638 #SC->SC_MP++ = c; 
639 sc->sc_escape = 0; 
640 return; 
641 } 
642 /* can't put lower; would miss an extra frame */ 
643 sc->sc_flags |= SC_ERROR; 
644 error: 
645 sc->sc_if.if_ierrors++; 
646 newpack: 
647 sc->sc_mp = sc->sc_buf = sc->sc_ep - SLMAX; 
648 sc->sc_escape = 0; 
649 } 

if alc 





O 5-12 [ [D slinput 
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546-636 slinput c TTY CHARMASK 
° c ESC ESC slinput ESC c 
° e END ESC slinput END c 
° c[] SLIP ESC sc_escape slinput ( ESC 
) 
° c[] SLIP END IP SLIP 
5-13 
if sl.c 
560 case FRAME END: 
561 if (sc->sc flags & SC ERROR) { 
562 sc->sc_flags &= “SC ERROR; 
563 goto newpack; 
564 } 
565 len = sc->sc_mp - sc->sc_buf; 
566 if (len < 3) Å 
567 /* less than min length packet - ignore */ 
568 goto newpack; 
569 if (sc->sc bpf) I 
570 /* 
571 * Save the compressed header, so we 
572 * can tack it on later. Note that we 
573 * will end up copying garbage in some 
574 * cases but this is okay. We remember 
575 * where the buffer started so we can 
576 * compute the new header length. 
577 */ 
578 bcopy (sc->sc_buf, chdr, CHDR_LEN); 
579 } 
580 if ((c = (*sc->sc_buf & Oxf0)) != (IPVERSION << 4)) { 
581 if (c & 0x80) 
582 c = TYPE_COMPRESSED_TCP; 
583 else if (c == TYPE UNCOMPRESSED TCP) 
584 *sc->sc_buf &= 0x4f; /* XXX */ 
585 /* 
586 * We've got something that's not an IP packet. 
587 * If compression is enabled, try to decompress it. 
588 * Otherwise, if auto-enable compression is on and 
589 * it's a reasonable packet, decompress it and then 
590 * enable compression. Otherwise, drop it. 
591 */ 
592 if (sc-»sc if.if flags & SC COMPRESS) ( 
593 len = sl uncompress tcp(&sc-»sc buf, len, 
594 (u int) c, &sc-»sc comp); 
595 if (len <= 0) 
596 goto error; 
597 } else if ((sc->sc_if.if_flags & SC_AUTOCOMP) && 
598 Cc == TYPE UNCOMPRESSED TCP && len >= 40) L 
599 len = sl_uncompress_tcp (&sc->sc_buf, len, 
600 (u int) c, &sc->sc_comp); 
601 if (len <= 0) 
602 goto error; 
603 sc->sc_if.if_flags |= SC_COMPRESS; 
604 } else 


05-13 OQ slinput [00000 


108 








TCP/IP 
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605 goto error; 
606 } p 
607 if (sc->sc_bpf) { 
608 FE 
609 * Put the SLIP pseudo-"link header". in place. 
610 * We couldn't do this any earlier since 
611 * decompression probably moved the buffer 
612 * pointer. Then, invoke BPF. 
613 XI 
614 u_char "hp = sc->sc buf - SLIP_HDRLEN; 
615 hp[SLX_DIR] = SLIPDIR_IN; 
616 bcopy(chdr, &hp[SLX CHDR], CHDR LEN); 
617 bot tap(sc-»sc bpf, hp, len + SLIP HDRLEN); 
618 ) 
619 m = sl btom(sc, len); 
620 if (m -- NULL) 
621 goto error; 
622 sc->sc_if.if_ipackets++; 
623 sc->sc_if.if_lastchange = time; 
624 s = splimp(); 
625 if (IF QFULL(&ipintrq)) { 
626 IF DROP (&ipintrg); 
627 sc->sc if.if ierrors++; 
628 sc->sc if.if igdrops++; 
629 m freem(m); 
630 ) else ( 
631 IF ENQUEUE(&ipintrq, m); 
632 Schednetisr (NETISR IP); 
633 J 
634 splx(s); 
635 goto newpack; E 
if sl.c 
418 1013 
switch switch[] ( default ) 
4 case switch 
637-649 switch IP| 
) sc escape slinput 
slinput SC ERROR 
error newpack 
sc_escape slinput 
5-13 5-12 FRAME END 
560-579 SC_ERROR 3 ( 
) slinput SLIP 
SLIP BPF[] slinput[] char ( 
) 
580-606 slinput IP 
TCP TCP| [o 



















































































































































































sl uncompress tcp 
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sl_uncompress_tcp TCP 
slinput 29.13 
607-618 SLIP|] BPF 5-14 slinput 
hp [SLX DIR] 

































































































































hp [SLX CHDR] 


CHDR, LEN 


SLIP HDRLEN 





sc->sc buf 


05-14 BPFO D D SLIP[] D 


















































| oo 99] 


-000 š 
den] [] ) 




































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































BPF (SLIPDIR IN) 
ap 
619-635 sl btom mbu 
sl btom but sl 
mbuf 
sl btom 
SLIP IP slinput 
) ipintrg | | | slinput newpack 
sc escape 
ipintrq SLIP if ierrors 
spltty slinput splimp 1-14 
splimp spltty 
5.3.4 SLIP sloutput 
if output 
ether out t([] 5-15) 
259-289 sloutput|] 4 SLIP ifnet 
sl_softc ) m dst 
rtp sloutput 4 
sloutput ifnet if_output 
sloutput dst IP TTY TTY 
( 
290-291 SLIP if snd 
292-295 ICMP SC NOICMP 
SLIP ICMP ECHO (J 11] ) 






























































































































































































































































110 roman 0: China-pubıcom 
OCT BEE 





259 int if slc 
260 sloutput(ifp, m, dst, rtp) 
261 struct ifnet *ifp; 
262 struct mbuf *m; 
263 struct sockaddr *dst; 
264 struct rtentry *rtp; 
265 { 
266 struct sl softc *sc = &sl softc[ifp->if unit]; 
267 struct ip *ip; 
268 struct ifqueue *ifg; 
269 int s; 
270 ja 
271 * Cannot happen (see slioctl). Someday we will extend 
272 * the line protocol to support other address families. 
273 */ 
274 if (dst->sa_family != AF_INET) ( 
275 printf("sl%d: af%d not supported\n", sc->sc_if.if_unit, 
276 dst->sa_family); 
277 m_freen (m); 
278 sc->sc if.if noproto++; 
279 return (EAFNOSUPPORT); 
280 } 
281 if (sc->sc_ttyp == NULL) { 
282 m freem(m); 
283 return (ENETDOWN); /* sort of */ 
284 } 
285 if ((sc->sc_ttyp->t_state & TS CARR ON) == 0 && 
286 (sc-»sc ttyp->t cflag € CLOCAL) == 0) { 
287 m freem(m); 
288 return (EHOSTUNREACH); 
289 } 
290 ifq = &sc->sc_if.if_snd; 
291 ip = mtod(m, struct ip *); 
292 if (sc->sc if.if flags & SC NOICMP && ip->ip_p == IPPROTO_ICMP) { 
293 m_freem(m); 
294 return (ENETRESET); /* XXX ? */ 
295 ) 
296 if (ip-»ip tos € IPTOS LOWDELAY) 
297 ifq = &sc->sc fasta; 
298 s = splimp(); 
299 if (IF QFULL(ifq)) { 
300 IF DROP (ifg); 
301 m freem(m); 
302 splx(s); 
303 sc->sc_if.if_oerrors++; 
304 return (ENOBUFS); 
305 } 
306 IF_ENQUEUE (ifa, m); 
307 sc->sc_if.if_lastchange = time; 
308 if (sc->sc ttyp->t outq.c cc == 0) 
309 slstart (sc->sc_ttyp); 
310 splx(s); 
311 return (0); 
312 } 
if_sl.c 


O 5-15 90 sloutput 









































ENETRESET ( ) 11 
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ICMP 
Net/2 0 ping[] traceroute 
ICMP | | 
| | | | | 
296-297 TOS (IPTOS LOWDELAY) 
sc fastg 
RFC 1700[] RFC 1349 [Almquist 1992][] | TOS[] Telnet 
Rlogin[] FTP( TU TFTP[] SMTP( VT DNS(UDP ) 
1[] 3.2 
BSD ip tos SLIP IP 
TOS[] [| FTP( JU] Telnet[] Rlogin TCP 
IPTOS_LOWDELAY 
ip_tos 
298-312 ( TTY 
) sloutput slstart 
SLIP if_oerrors ether_output 
(ether output)[] sloutput 
SLIP ( 
ARP)[] IP ( ) 
SLIP IP 
5.3.5 slstart 
sloutput TTY TTY 
slstart[] TTY clist 5-8 clist 
t outq slstart t oproc slstart 
t oproc 
slstart 5-16 
318-358 slstart tp tty slstart for 
t outq slstart t oproc 
TTY 100 (SLIP HIWAT) 
slstart 
TTY slstart 
TTY sc fastq sc fastaq 
if snd 
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TCP/IP 2 
SNMP TOS 353 XXX 
SLIP if_omcasts 
359-383 SLIP BPF[] slstart 
bpfbuf 
384-388 TCP sloutput sl 
compress_tcp IP (29.13 
) 
389-398 BPF SLIPDIR_OUT BPF 
bpf_tap 
483-484 for slstart 
318 void er 


319 slstart (tp) 
320 struct tty *tp; 


321 ( 
322 
323 
324 
325 
326 
327 
328 
329 
330 


331 
332 
333 
334 
335 
336 
337 
338 
339 
340 
341 
342 
343 
344 
345 
346 


347 
348 
349 
350 
351 
352 
353 
354 
355 
356 
357 
358 


struct sl_softc *sc = (struct sl_softc *) tp->t_sc; 
struct mbuf *m; 

u_char *cp; 

struct ip *ip; 


int 


s; 


struct mbuf *m2; 
u_char bpfbuf [SLMTU + SLIP_HDRLEN]; 


int 
ext 


for 


len; 
ern int cfreecount; 


Gi) L 
/* 
* If there is more in the output queue, just send it now. 
* We are being called in lieu of ttstart and must do what 
* it would. 
*/ 
if (tp->t_outq.c_cc != 0) { 
(*tp->t_oproc) (tp); 
if (tp->t_outq.c_cc > SLIP HIWAT) 
return; 
} 
/* 
* This happens briefly when the line shuts down. 
*/ 
if (sc == NULL) 


return; 
/* 
* Get a packet and send it to the interface. 
*/ 


s = splimp(); 
IF_DEQUEUE (&sc->sc_fastg, m); 
if (m) 

sc->sc_if.if_omcasts++; /* XXX */ 
else 

IF DEQUEUE(&SC-»SC if.if eng, m); 
splx(s); 
if (m == NULL) 

return; 


O 5-16 DO sistart [JT] Ht 
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359 /* 
360 * We do the header compression here rather than in sloutput 
361 * because the packets will be out of order if we are using TOS 
362 * queueing, and the connection id compression will get 
363 * munged when this happens. 
364 */ 
365 if (sc->sc_bpf) { 
366 /* 
367 * We need to save the TCP/IP header before it’s 
368 * compressed. To avoid complicated code, we just 
369 * copy the entire packet into a stack buffer (since 
370 * this is a serial line, packets should be short 
371 * and/or the copy should be negligible cost compared 
372 * to the packet transmission time). 
373 */ 
374 struct mbuf *ml = m; 
375 u_char *cp = bpfbuf + SLIP_HDRLEN; 
376 len = 0; 
377 do { 
378 int mlen = ml->m len; 
379 bcopy (mtod (ml, caddr t), cp, mlen); 
380 cp += mlen; 
381 len += mlen; 
382 } while (ml = ml->m next); 
383 ) 
384 if ((ip = mtod(m, struct ip *))-»ip p == IPPROTO TCP) { 
385 if (sc-»sc if.if flags & SC COMPRESS) 
386 *mtod(m, u_char *) |= sl compress tcp(m, ip, 
387 &sc->sc comp, 1); 
388 ) 
389 if (sc-»sc bpf) { 
390 /* 
391 * Put the SLIP pseudo-"link header" in place. The 
392 * compressed header is now at the beginning of the 
393 * mbuf. 
394 ST 
395 bpfbuf [SLX DIR] = SLIPDIR OUT; 
396 bcopy (mtod(m, caddr t), &bpfbuf [SLX CHDR], CHDR LEN); 
397 bpf_tap(sc->sc_bpf, bpfbuf, len + SLIP HDRLEN); 
398 } 
483 } 
484 } 
if sl.c 
U 5-16 (U) 
slstart (U 5-17) 
5-16 
399-409 clist 
slstart 
410-418 TTY 























































































































































































































114 





China-pubecom 























































































































































































































































































































































































































































































































































































































































































































TCP/IP 2 
slstart SLIP END 
0 SLIP IP 
— - if sl.c 
399 sc->sc_if.if_lastchange = time; 
400 /* 
401 * If system is getting low on clists, just flush our 
402 * output queue (if the stuff was important, it'll get 
403 * retransmitted). 
404 */ 
405 if (cfreecount < CLISTRESERVE + SLMTU) ( 
406 m_freem (m) ; 
407 sc->sc if.if collisions++; 
408 continue; 
409 ) 
410 /* 
411 * The extra FRAME END will start up a new packet, and thus 
412 * will flush any accumulated garbage. We do this whenever 
413 * the line may have been idle for some time. 
414 */ 
415 if (tp->t_outq.c_cc == 0) ( 
416 ++sc->sc_if.if_obytes; 
417 (void) putc (FRAME END, &tp->t outq); 
418 } < 
if_sl.c 
05-17 00 sistat [] D J HD J D I D 
5-18 Phil Karn RFC 1055 5- 
18 (END) 
END 
DUDU 



































D 1 » 1 2 O 3 
(OK) «nu» (OK) 
05-18 Kam OO SLIPD 0 D 0 0 0 U 
5-19 0 
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[] 1 » e 03 

(OK) (OK) 
WY 

n 2 
«D» 
H 5-19 D DI D D Kan O 
slstart ([] 5-20) mbu TTY 
419-467 while mbu while 
mbuf| while cp END[] ESC 
b_to_q bp[] cp END[] ESC putc 
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mbu TTY 5-21 
SLIP END SLIP ESC mbu 
bp b to q mbuf| cp ep 
mbuf| 
i if slc 
419 while (m) ( 
420 u char *ep; 
421 cp = mtod(m, u char *); 
422 ep = cp + m-»m len; 
423 while (cp « ep) ( 
424 /* 
425 * Find out how many bytes in the string we can 
426 * handle without doing something special. 
427 */ 
428 u char *bp - cp; 
429 while (cp « ep) ( 
430 switch (*cp++) { 
431 case FRAME_ESCAPE: 
432 case FRAME_END: 
433 --Cp; 
434 goto out; 
435 H 
436 } 
437 out: 
438 if (cp > bp) { 
439 pe 
440 * Put n Characters at once 
441 * into the tty output queue. 
442 */ 
443 if (b to g((char *) bp, cp - bp, 
444 &tp->t_outg)) 
445 break; 
446 sc->sc_if.if_obytes += cp - bp; 
447 } 
448 /* 
449 * If there are characters left in the mbuf, 
450 * the first one must be special.. 
451 * Put it out in a different form. 
452 */ 
453 if (cp « ep) ( 
454 if (putc(FRAME ESCAPE, &tp->t outq)) 
455 break; 
456 if (putc(*cp++ == FRAME ESCAPE ? 
457 TRANS, FRAME ESCAPE : TRANS, FRAME END, 
458 &tp-»t, outq)) L 
459 (void) unputc (&tp->t_outg) ; 
460 break; 
461 } 
462 sc->sc_if.if_obytes += 2; 
463 } 
464 } 
465 MFREE (m, m2); 
466 m = m2; 
467 } 





if_sl.c 
05-20 OO sistart [] I 000 
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OO000Ob tog OO00O0O»b tog OOO0O0Ob tog 


putc(FRAME ESCAPE, ...) putec (FRAME ESCAPE, ...) 
putc(TRANS FRAME END, ...) putc (TRANS FRAME ESCAPE, ...) 


D 5-21 D D mbu SLIPO O 
























































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































b. to d[] putc ( TTY ) break slstart 
while clist mbuf TTY 
mbuf| m mbuf while 
mbu 
5-22 slstart 
- if sl.c 
468 if (putc(FRAME END, &tp-»t outq)) { 
469 pe 
470 * Not enough room. Remove a char to make room 
471 * and end the packet normally. 
472 * I£ you get many collisions (more than one or two 
473 * a day) you probably do not have enough clists 
474 * and you should increase "nclist" in param.c. 
475 ës 
476 (void) unputc(&tp-»t outq); 
477 (void) putc(FRAME END, &tp-»t outq); 
478 sc->sc if.if collisions++; 
479 ) else { 
480 ++8c->sc if.if obytes; 
481 sc->sc if.if opackets++; 
482 H š 
if sl.c 
05-22 DO sistart 000000 
468-482 while 
SLIP END 
END 
slstart END 
5.3.6 SLIP 
SLIP TTY SLIP 
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SLIP 
25.11 
TCP UDP 
( 5.8) 
5.3.7 SUP DO 
SLIP MTU(SLMTU)[] clist (high-water mark)(SLIP HIWAT)[] SLIP 
TOS 
1) MTU ( ) 
MTU SLIP 
40 TCP IP 
MTU 
TCP/IP RFC 1144 [Jacobson 1990a] 
9600 b/s SLIP 296 
MTU 29.13 SLIP(CSLIP) 11] 2.10 7.2 
SLIP 
2) clist[] ( SLIP HIWAT )ITOS 
SLIP TTY 
( SLIP_HIWAT ) slstart 
SLIP_HIWAT 100 
TTY slstart 100 slstart 
3) SLIP TOS sc fastg 
if snd 
5.3.8 slclose 
slclose slattach SLIP[] TTY 
210 void i slc 
211 slclose(tp) 
212 struct tty *tp; 
213 ( 
214 struct sl softc *sc; 
215 int s; 
216 ttywflush(tp); 
217 s = splimp(); /* actually, max(spltty, splnet) */ 
218 tp->t_line = 0; 
219 sc = (struct sl_softc *) tp->t_sc; 
220 if (sc != NULL) ( 
221 if_down(&sc->sc_if); 
222 sc->sc_ttyp = NULL; 
223 tp->t_sc = NULL; 


0 5-23 DI s1c1ose 
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224 MCLFREE ( (caddr_t) (sc->sc_ep - SLBUFSIZE)); 
225 sc->sc_ep = 0; 
226 sc->sc mp = 0; 
227 sc->sc buf = 0; 
228 ) 
229 splx(s); 
230 } 2 
if s.c 
U 5.223 (11) 
210-230 tp TTY slclose 
TTY TTY TTY SLIP 
mbuf] 
splx TTY | 
5.3.9 sltioctl|| 
SLIP 
° TTY 
5-7 slioctl SLIP ioctl 
4.4 ifioctl slioctl ioctl 
| 
5-7 sltioctl SLIP TTY ioctl 
sltioctl 5-24 
[] [] [] [] [] U [] [] 
SLIOCGUNIT int * sltioctl DOODOTTY0 00000000 
D 5-24 sitioctl [] [| 
sltioctl 5-25 
if sl.c 
236 int L 
237 sltioctl(tp, cmd, data, flag) 
238 struct tty *tp; 
239 int cmd; 
240 caddr t data; 
241 int flag; 
242 I 
243 struct sl softc *sc = (struct sl softc *) tp->t sc; 
244 switch (cmd) ( 
245 case SLIOCGUNIT: 
246 *(int *) data = sc-»sc if.if unit; 
247 break; 
248 default: 
249 return (-1); 
250 ) 
251 return (0); 
252 ) S 
if alc 


H 5-25 [][] sltioctl 
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5 SLIP 
236-252 tty t sc sl softc SLIP 
if unit *data (17.50 ) 
slattach if unit slattach TTY 
SLIP slopen t sc TTY SLIP s1 softc 
SLIOCGUNIT 
5.4 0000 
([] 5-26) 
if output 
=> 
clnlintrq: PIS ipintrq: | 
0526 0200092090 
if_output looutput 
IFF_SIMPLEX ether_output looutput 
12 
looutput 5-27 
EE 4i Å 
57 int Zomm: 
58 looutput (ifp, m, dst, rt) 
59 struct ifnet *ifp; 
60 struct mbuf *m; 
61 struct sockaddr *dst; 
62 struct rtentry *rt; 
63 ( ` 
64 int s, isr; 
65 struct ifqueue *ifq = 0; 
66 if ((m->m_flags & M_PKTHDR) == 0) 
67 panic("looutput no HDR"); 
68 ifp->if_lastchange = time; 
69 if (loif.if bpf) { 
70 /* 
71 * We need to prepend the address family as 
72 * a four byte field. Cons up a dummy header 
73 * to pacify bpf. This is safe because bpf 
74 * will only read from the mbuf (i.e., it won't 
75 * try to free it or keep a pointer a to it). 
76 */ 


O 5-27 DD looutput 

















120 


TCP/IP 












































China-pub.com 

































































































































































































































































































































































































































































































































































77 struct mbuf m0; 

78 u_int af = dst->sa_family; 

79 m0.m_next = m; 

80 m0.m_len = 4; 

81 m0.m data = (char +) &af; 

82 bpf mtap(loif.if bet, &m0); 

83 J 

84 m-»m pkthdr.rcvif = ifp; 

85 if (rt && rt-»rt flags & (RTF REJECT | RTF BLACKHOLE)) ( 

86 m freem(m); 

87 return (rt-»rt flags & RTF BLACKHOLE ? O : 

88 rt->rt flags & RTF HOST ? EHOSTUNREACH : ENETUNREACH); 

89 } 

90 ifp->if_opackets++; . 

91 ifp->if obytes 42 m->m_pkthär.len; 

92 switch (dst->sa family) ( 

93 case AF INET: 

94 ifg = &ipintrg; 

95 isr = NETISR_IP; 

96 break; 

97 case AF_ISO: 

98 ifq = &clnlintrg; 

99 isr = NETISR_ISO; 

100 break; 

101 default: 

102 printf("lo%d: can't handle aftd\n", ifp->if unit, 

103 dst->sa family); 

104 m freem(m); 

105 return (EAFNOSUPPORT); 

106 ) 

107 s = splimp(); 

108 if (IF QFULL(ifq)) { 

109 IF DROP(ifq); 

110 m freem(m); 

111 splx(s); 

112 return (ENOBUFS); 

113 } 

114 IF ENQUEUE(ifq, m); 

115 Schednetisr(isr); 

116 ifp->if_ipackets++; 

117 ifp->if_ibytes += m->m_pkthär.len; 

118 splx(s); 

119 return (0); 

120 } : 

if loop.c 
[ 5-27 (U) 
57-66 looutput ether output ifnet 
if output ifp ifnet m 
dst rt mbuf 
looutput panic 
5-28 BPF 

69-83 mo BPF mo mbuf 
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mo mbu mbu mO[] m data 
af 5-29 
























































































































































































































































































































































































































































































































































































































































































































































































































































































































































H looutput ` n H H mbuf 
(DUDU 0000 
O 5-29 BPFOO OOO mbuf O 
looutput a mbu bpf_mtap 
bpf_tap mbu 
BPF mbu mo ( mbuf) 
bpf_mtap 
84-89 looutput input 
m->m_pkthdr.rcvif 

looutput (RTF_REJECT) 

(RTF BLACKHOLE) mbuf| 0 
looutput EHOSTUNREACH 








































































































































































































































































































































































































































































































































































































































































































































































































































































































ENETUNREACH 
RTF xxx 18-25 
90-120 looutput sa family 
schednetisr 
55 DI 
s10 SLIP 100 
SLIP SLIP SLIP 
TOS SLIP 















































































































































































































































































































































U U 


5.1 
5.2 
5.3 
54 
53 
5.6 


5.7 


5.8 




















BE ma China-pub.eom 
CZ 5 5 ) — ila 















































































































































































































































































































































U D DD D 
ODODO 5-27 mo [] L] U D D ULU 
DO 19 200 b/s] 0000 SLIP 0000000000 SLIPMTUD D D] O 0 D 
000000000000 0 SLIP MTUJ D D H 
O [] SLIP ODO 
QO siinpguttdllüununmumgmuuggummuuututurnt sc Error] ODO 
U U 00000000 0 D 0 0 U 
O0 4-319 lef OO 0 ifp->if uniti) le softc 000000000000 
uie 
U U U D 0 0 0 0 0 0 0 0 0 UD U U UDP D D 0 0 D 0 0 U 

















Ais 


O eQ 


IP [] O 






































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































6.1 [I Ú 
Net/3 IP in ifaddr|] sockaddr in 
ifaddr|| sockaddr 
IP IP 
6.1.1 IP 
Internet 
IP ( ) 
IP 
IP 5 Af] BU € IP 
12 
E 
IP 
IP IP Internet 
IP 
IP (RFC 950 [Mogul and Postel 1985] 1 
IP 
127.0.0.0 A 
RFC 1122 
127.0.0.1 
127.0.0.2 
127.0.0.1 
18-2 Net/3 127.0.0.1 
6.1.2 IPOD [] 
IP 6-1 IP 


















































































































































































































































124 «mi 0 China"pub.tom 
AA tteg 






































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































U D U 0 O 0 O 
A 0.0.0.0] 127.255.255.255 
B 128.0.0.0[] 191.255.255.255 nn 
C 192.0.0.0[] 223.255.255.255 
D 224.0.0.0[] 239.255.255.255 m 
E 240.0.0.0[] 247.255.255.255 000 
061 DO IP 0 0 D D 
L / / B 
16/11/5) 
IP 
6-2 (1.140 ) Sun 
140 252 13 33 
`. BO DD 140.252 90108 — 001, 
00 
255 255 255 224 EST 
: e 
KH OD OD = BW e 
`. Z Ue ip o 
0000 
EE | 
140 252 13 63 
e D H 140.252 | J 0 105 ‚6000 
' ⁄ OM 4 
062 JO00POOOOO 
O[] 1 
6-31 
6.1.3 
Internet 
IP 
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Telnet SNMP 
0 0 RFC 1122 
HU 
Net/3 
ipforwarding 0 ipforwarding[] O( ) 
Net/3 u 
| IP u 
ipforwarding[] 0 Net/3 GATEWAY] 
ipforwarding 1 
6.2 UOUE 
6-3 C 
[] U [] [] 
netinet/in.h Internet] 0 O Ü 
netinet/in var.h | Internet] [| DD 
netinet/in.c Internet] [] D] 000090 
netinet/if.c Internet] [] U D U Ü 
063 UHHHHHNn 






































































































































in ifaddr struct in ifaddr in ifaddr[| 000000 
in interfaces int OPOOOOOOO 


064 000000200090 














63 0000000 
































































































































































































































































































































































































































































































































































































































































































































6-5 
6-5 SLIP 
IP SLIP 
IP IP OSI 
IP in ifaddr| ifnet addrs 
I [] 6-5 | ELE] ifaddr o ifa ifpl] 
ifaddr ifnet 
6-5 IP| ioctl 
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ifnet: 





ifnet_addrs: 





OM in ifadar()Q 
OO rader OD | 


in ifaddr: 







le softc[0] : 


in 1faddr() 


in ifa 


6.4 sockaddr_in|]| || 






















































































ddr() 


ifnet {} 


ifaddr() 


sockaddr_d1{} 
sockaddr dl() 


in ifaddr() 
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Sl softc[0]: 












065 nüupnaanpaund 


















































































































loif: 


ifaddr() 


in ifaddr() 


iso ifaddr() 


sockaddr dl() 


sockaddr dl() 


ifaddr() 
j 



































































































































































































































































































































































































































































































AF_INET 












































































































































sin_addr 
























































3 sockaddr[] ifaddr IP 
Sockaddr in||in ifaddr Internet Sockaddr in 
68-70 Net/3 Internet in addr 
s addr Net/3 
106-112 sin len 16( Sockaddr in ) sin family 
sin port ( JO 16 bit 
32 bit Internet 
6-6 Sockaddr in sin port[] sin addr[] sin zero 






















































































Sockaddr 
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sa_data Internet sin_zero 0 2.70) 
sockaddr in sockaddr 
7 in.h 
68 struct in addr ( 
69 . wu long s_addr; /* 32-bit IP address, net byte order */ 
70 ); 


106 struct sockaddr in ( 












































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































107 u char sin len; /* sizeof (struct sockaddr in) = 16 */ 
108 u char sin family; /* AF INET */ 
109 u short sin port; /* 16-bit port number, net byte order */ 
110 struct in addr sin addr; 
111 char sin zero[8]; /* unused */ 
112 }; . 
in.h 
O 6-6 U U sockaddr in 
Internet u long 
in addr (O 6-7) s addr 
family 
sockaddr{} en] data 
family 14 bytes 
PE addr | 
sockaddr in() =E port in_addr() zero 
4 bytes 8 bytes 
u long addr.s addr 
4 bytes 
[16-7 00 sockaddr in [0 (00 sn 10 H 
6.5 in ifaddr[|[] 
6-8 Internet IP 
in ifaddr IP (U 6-5) 
41-45 in ifaddr ia ifa IP ifaddr 
3-15 ia_ifpll ia flags ifaddr 
ia nezt Internet 
ifaddr in_ifaddr 
46-54 ( ia_multiaddrs) 6-9 B 
sun u_long in_addr 
sockaddr_in sun PPP 
PPP[] SLIP 
55=56 in ifaddr in multi (12.6[] ) 









































































































































IP 
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3 








in var.h 
41 struct in ifaddr ( 
42 struct ifaddr ia ifa; /* protocol-independent info */ 
43 #define ia ifp ia ifa.ifa ifp 
44 #define ia flags ia ifa.ifa flags 
45 struct in ifaddr *ia next; /* next internet addresses list */ 
46 u long ia net; /* network number of interface */ 
47 u long ia netmask; /* mask of net part */ 
48 u long ia subnet; /* subnet number, including net */ 
49 u_long ia_subnetmask; /* mask of subnet part */ 
50 struct in addr ia netbroadcast; /* to recognize net broadcasts  */ 
51 struct sockaddr in ia addr; /* space for interface name * 7 
52 struct sockaddr_in ia_dstaddr; /* space for broadcast addr * / 
53 #define ia broadaddr ia dstaddr 
54 struct sockaddr_in ia_sockmask; /* space for general netmask */ 
55 struct in multi *ia_multiaddrs; /* list of multicast addresses */ 
56 y; 

in_var.h 


0 6-8 [| [| in ifaddr 


















































































































sockaddr_in 



































D DDD DD 00 U 















































140.252.13.33 140.252.1.29 






















































































































































































ia net u long MNA 
140.252.0.0 140.252.0.0 127.0.0.0 m 

ia netmask u long Si et EI 
255.255.0.0 255.255.0.0 255.0.0.0 = 

ia subnet u, long D ti E 





















































































































































: E 
1402521332 140.252.1.0 1270.00 


255.255.255.224 255.255.255.0 255.0.0.0 














































































































ia_netbroadcast |in_addr [ amm a as: RA 


140.252.255.255 140.252.255.255 127.255.255.25| "Y 














ia_broadaddr sockaddr_in [ T HM ONE 


140.252.13.63 LU U U U U LI 














ia dstaddr sockaddr in 





140.252.1.183 


ia sockmask sockaddr_in : 
ia subnetmask 








255.255.255.224 255.255.255.0 255.0.0.0 


























Om 
| 




































































































































































































































































































































































































































































DU D B B B U 
06-9 sul 00000 PPPO UO inifasr 00 
6.6 0000 
4 Internet 
IP Net/3 ifconfig 
ifconfig ioctl 
/etc/netstart shelll 
6-10 ioctl 
( UDP OSI ) IP ioctl 
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UDP[] U 

Oo E U U U U U Ë 
SIOCGIFADDR struct ifreq * in_control 00000 
SIOCGIFNETMASK struct ifreg * in_control 000000 
SIOCGIFDSTADDR struct ifreq + in control 0000000 
SIOCGIFBRDADDR struct ifreg * in_control 000000 
SIOCSIFADDR struct ifreg * in_control 00000 
SIOCSIFNETMASK struct ifreg * in_control 0020000000 
SIOCSIFDSTADDR struct ifreg * in control 0000000 
SIOCSIFBRDADDR struct ifreg * in_control 0000000 
SIOCDIFADDR struct ifreq + in control 000000 
SIOCAIFADDR struct in aliasreg |* in control 00000 

O 6-10 QQ ioctl OO 










mn! < 
Ya 


u Hau 


if ioctl 





06-11 000000 ieee D D 
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FRE RE H 


































































































































































































































































































































































































SIOCG SIOCS SIOC 
socket ioctl[] G get S set 
4 0 sy 0 | ioctl 6-10 | 
| | LU 0 | 6-11 
ioctl 








































































































6.6.1 ifioctl 




























































































































































































































































































































































































































































































































































































































































































































































































































































































6-11 ifioctl ioctl pr_usrreq 
udp_usrreq in_control in_control 
TCP in_control 
6-12 l ifioctl default 4-220 0 
447 default: ifc 
448 if (so->so_proto == 0) 
449 return (EOPNOTSUPP); 
450 return ((*so->so_proto->pr_usrreq) (so, PRU CONTROL, 
451 cmd, data, ifp)); 
452 1 å 
453 return (0); 
454 ) š 
if.c 
06-12 ID ificett 00000000 
447-454 6-10 ioctl 
UDP [] udp_usrreg[] 23.10 | udp_usrreq 
udp_usrreq PRU_CONTROL 
if (req == PRU_CONTROL) 
return (in_control(so, (int)m, (caddr_t)addr, (struct ifnet *)control)); 











6.6.2 in_control 















































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































6-11 soo_ioctl default[] ifioctl 
in_control udp usrreq in control 
in control 6-13 in control 
132-145 so ioctl ( cmd ) data 
([] 6-10 ) ifp ( soo_ioctl 
ioctl) ifreq|| in aliasreq ( 3fioctl ioctl) 
in control ifr|| ifra ifreq[] in aliasreq[][][] data 
146-152 ifp ifnet for g Internet 
ia in_ifaddr ia 
ifp cmd switch switch 
switch default ifp EOPNOTSUPP 
153-330 in control switch switch 
LU LU U U U 
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in.c 
































132 in control(so, cmd, data, ifp) 
133 struct socket *so; 

134 int cmd; 

135 caddr t data; 

136 struct ifnet *ifp; 


137 I 

138 struct ifreq *ifr = (struct ifreq +) data; 

139 struct in ifaddr *ia = 0; 

140 struct ifaddr *ifa; 

141 struct in ifaddr *oia; 

142 struct in_aliasreg *ifra = (struct in aliasreg +) data; 
143 struct sockaddr in oldaddr; 

144 int error, hostIsNew, maskIsNew; 

145 u long i; 

146 /* 

147 * Find address for this interface, if it exists. 
148 * 

149 ` if (ifp) 

150 for (ia = in_ifaddr; ia; ia = ia->ia next) 
151 if (ia->ia_ifp == ifp) 

152 break; 

153 switch (cmd) { 





218 } 
219 switch (cmd) { 





326 default: 


327 if (ifp == 0 || ifp->if_ioctl == 0) 

328 return (EOPNOTSUPP); 

329 return ((*ifp->if ioctl) (ifp, cmd, data)); 
330 } 

331 return (0); 

332 } 

















































































































































































































































































































































































































































































































































































































































































































































































































































































































O 6-13 [ [] in control 
switch default ifp 
if ioctl in control|| ioctl 
Net/3 default 
ioctl case 
331=332 switch 
switch in control 0 switch case 
ioctl 
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6.6.3 SIOCSIFADDR[] SIOCSIFNETMASK[] SIOCSIFDSTADDR 
6-14 SIOCSIFADDR|| SIOCSIFNETMASK|| SIOCSIFDSTADDR 
166 case SIOCSIFADDR: 
167 case SIOCSIFNETMASK: 
168 case SIOCSIFDSTADDR: 
169 if ((so->so_state & SS_PRIV) == 0) 
170 return (EPERM); 
171 if (ifp == 0) 
172 panic("in control"); 
173 if (ia == (struct in ifadår +) 0) I 
174 oia = (struct in ifaddr *) 
175 malloc(sizeof *oia, M IFADDR, M_WAITOK); 
176 if (oia == (struct in ifaddr *) NULL) 
177 return (ENOBUFS); 
178 bzero((caddr t) oia, sizeof *oia); 
179 if (ia = in ifaddr) { 
180 for (; ia->ia next; ia = ia->ia next) 
181 continue; 
182 ia->ia next = oia; 
183 ) else 
184 in ifaddr = oia; 
185 ia = oia; 
186 if (ifa = ifp->if addrlist) { 
187 for (; ifa->ifa next; ifa = ifa->ifa next) 
188 continue; 
189 ifa->ifa next = (struct ifaddr *) ia; 
190 } else 
191 ifp->if_addrlist = (struct ifaddr *) ia; 
192 ia->ia_ifa.ifa_addr = (struct sockaddr *) &ia->ia addr; 
193 ia->ia ifa.ifa dstaddr 
194 = (struct sockaddr *) &ia->ia dstaddr; 
195 ia->ia ifa.ifa netmask 
196 = (struct sockaddr *) &ia->ia sockmask; 
197 ia->ia sockmask.sin len = 8; 
198 if (ifp->if flags & IFF BROADCAST) ( 
199 ia->ia broadaddr.sin len = sizeof(ia-»ia addr); 
200 ia->ia broadaddr.sin family = AF INET; 
201 ) | 
202 ia->ia ifp = ifp; 
203 if (ifp != &loif) 
204 in interfaces++; 
205 } 
206 break; 


O 6-14 DO in control [D D] UU Ú] 


switch switch 
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in.c 


in.c 
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166-172 in 
control EPERM panic ifioctl 
(O 4-22) panic 
socreate([] 15-16) SS_PRIV 
ID ID 
ioctl 
2. 
173-191 ia in_control in_ifaddr 
bzero | 









































































































































in_ifaddr 























if_addrlist 
3. 



























































192-206 







































ifaddr{} 






in_ifaddr{} 









































in_ifaddr 

















ifaddr 

































































in ifaddr 
























































sockaddr_in 



































ia sockmask 





0 6-15 [ in contro [IO O UJ O O inifaddr OQ 


































































































































































































































































































































































































































































































































































































ia broadaddr 6-15 
in ifaddr 
202-206 in control in ifaddr ifnet 
Net/3[] in interfaces 
6.6.4 [] SIOCSIFADDR 
ia SIOCSIFADDR in_ifaddr 
6-16 in_control switch|] |] 
in.c 
259 case SIOCSIFADDR: 
260 return (in ifinit(ifp, ia, 
261 (struct sockaddr in *) &ifr->ifr addr, 1)); ` 
in.c 
D 6-16 QQ in control 00000 























159-261 in_ifinit 















































IP ifreg (ifr_addr) 










































































in_ifinit 








6.6.5 in_ifinit 












































3n a Fa nate 
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. 
. 
Š ( ) 
° 
6-17 
393-337 in SÆR ALE ifp la 
in_ifaddr sin IP scrub 
i IP 
Ee I E in.c 
353 in ifinit(ifp, ia, sin, scrub) 
354 struct ifnet *ifp; 
355 struct in ifaddr *ia; 
356 struct sockaddr in *sin; 
357 int scrub; 
358 ( 
359 vu long i = ntohl(sin-»sin addr.s addr); 
360 struct sockaddr in oldaddr; 
361 int S - splimp(), flags - RTF UP, error, ether output(); 
362 oldaddr = ia->ia_addr; 
363 ia->ia addr = *sin; 
364 /* 
365 * Give the interface a chance to initialize 
366 * if this is its first address, 
367 * and to validate the address if necessary. 
368 */ 
369 if (ifp->if ioctl && 
370 (error = (*ifp-»if ioctl) (ifp, SIOCSIFADDR, (caddr t) ia))) { 
371 splx(s); 
372 ia->ia addr = oldaddr; 
373 return (error); 
374 ) 
375 if (ifp->if output == ether output) ( /* XXX: Another Kludge */ 
376 ia->ia ifa.ifa rtrequest = arp rtrequest; 
377 ia->ia ifa.ifa flags |= RTF CLONING; 
378 ) 
379 splx(s); 
380 if (scrub) ( 
381 la->ia_ifa.ifa_addr = (struct sockaddr +) &oldaddr; 
382 in_ifscrub(ifp, ia); 
383 ia->ia ifa.ifa addr = (struct sockaddr +) &ia->ia_addr; 
384 } : i 
In.c 
06-17 00 in ifinit 00000000000 
1. 
358-374 in control | oldaddr [] 
if ioctl in control 





















































































































































































































































leioctl|| slioctl[| loioctl 




















in_control 


2: 

























































































































































































375=378 arp rtrequest 






































RTF CLONING arp. rtrequest[] 21.13 RTF CLONING[] 19.4 
















































































Chinapubscon arno 135 













































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































XXX 
3. 
379-384 ifa_addr 
in_ifscrub in_ifscrub 
in_ifinit 6-18 
: in.c 
385 if (IN CLASSA(i)) 
386 ia-»ia netmask - IN CLASSA NET; 
387 else if (IN CLASSB(i)) 
388 ia->ia netmask - IN CLASSB NET; 
389 else 
390 ia->ia_netmask = IN CLASSC NET; 
391 /* 
392 * The subnet mask usually includes at least the standard network part, 
393 * but may may be smaller in the case of supernetting. 
394 * If it is set, we believe it. 
395 */ 
396 if (ia->ia_subnetmask == 0) { 
397 ia->ia subnetmask = ia->ia_netmask; 
398 ia->ia sockmask.sin addr.s addr = htonl (ia->ia_subnetmask) ; 
399 } else 
400 ia->ia_netmask &= ia->ia_subnetmask; 
401 ia->ia net = i & ia->ia_netmask; 
402 ia->ia subnet = i & ia->ia subnetmask; 
403 in socktrim(&ia->ia sockmask) ; ` 
m.c 
16-18 QQ in ifinit 00000000 
4. 
385-400 A B C ia netmask 
ia subnetmask||ia sockmask 
ia netmask 
in ifinit 
1 bit( 
0 bit 0 0) 
1 bit 
RFC 1519 [Fuller et al. 1993] 
A B C 1[] 10.8 
( ) ( 
SIOCSIFNETMASK[| SIOCAIFADDR) ( ) 
5. 
401-403 in_socktrim 
1 bit in_sockmask( sockaddr_in ) 
6-19 in_ifinit 
6. 





























































































































404-422 in_control 
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in_ifaddr 
IP 
in_control 
in_ifinit|| flags RTF_UP RTF_HOST 

rtindt ( RTF HOST) ( RTF HOST) 
rtinit ia flags IFA ROUTE 

AA 

404 /* 

405 * Add route for the network. 

406 XI 

407 ia->ia_ifa.ifa_metric = ifp->if_metric; 

408 if (ifp->if_flags & IFF_BROADCAST) { 

409 ia->ia broadaddr.sin addr.s addr = 

410 htonl(ia->ia subnet | ^ia-»ia subnetmask); 

411 ia->ia netbroadcast.s addr = 

412 htonl(ia->ia net | "ia-»ia netmask); 

413 ) else if (ifp->if flags & IFF LOOPBACK) { 

414 ia-»ia ifa.ifa dstaddr = ia->ia ifa.ifa addr; 

415 flags |= RTF HOST; 

416 ) else if (ifp->if flags & IFF POINTOPOINT) ( 

417 if (ia->ia dstaddr.sin family != AF INET) 

418 return (0); 

419 flags |- RTF. HOST; 

420 } : 

421 if ((error = rtinit(&(ia-»ia ifa), (int) RTM ADD, flags)) == 0) 

422 ia-»ia flags |- IFA ROUTE; 

423 pe 

424 * If the interface supports multicast, join the "all hosts" 

425 * multicast group on that interface. 

426 */ 

427 if (ifp->if_flags & IFF_MULTICAST) { 

428 struct in_addr addr; 

429 addr.s addr = htonl(INADDR ALLHOSTS GROUP); 

430 in addmulti(&addr, ifp); 

431 J 

432 return (error); 

433 ) 


06-19 QQ in ifinit DODODOO 


















































































































































































































































































































































































































































7. 
423-433 
in_addmulti 12.11 
6.6.6 | SIOCSIFNETMASK 
6-20 
in.c 
262 case SIOCSIFNETMASK: 
263 i = ifra->ifra_addr.sin_addr.s_addr; 
264 ia->ia subnetmask = ntohl (ia->ia_sockmask.sin_addr.s_addr = i); 
265 break; . 
in.c 





1620 []H an eontrel. 100000 
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262-265 in_control|l|ifreg 



































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































ia sockmask ia subnetmask 
6.6.7 | UO] | [| SIOCSIFDSTADDR 
SIOCSIFDSTADDR 6-14 
6-21 
in.c 
236 case SIOCSIFDSTADDR: 
237 if ((ifp->if_flags & IFF_POINTOPOINT) == 0) 
238 return (EINVAL); 
239 oldaddr = ia->ia_dstaddr; 
240 ia->ia dstaddr = *(struct sockaddr in *) &ifr->ifr_dstaddr; 
241 if (ifp->if ioctl && (error = (*ifp->if ioctl) 
242 (ifp, SIOCSIFDSTADDR, (caddr t) ia))) { 
243 ia->ia dstaddr = oldaddr; 
244 return (error); 
245 ) 
246 if (ia-»ia flags & IFA ROUTE) { 
247 ia-»ia ifa.ifa dstaddr = (struct sockaddr *) &oldaddr; 
248 rtinit(&(ia-»ia ifa), (int) RTM DELETE, RTF HOST); 
249 ia-»ia ifa.ifa dstaddr = 
250 (struct sockaddr +) &ia->ia dstaddr; 
251 rtinit(&(ia-»ia ifa), (int) RTM ADD, RTF HOST | RTF UP); 
252 } 
253 break; í 
in.c 
0 6-21 QQ in contra 0000000 
236-245 in_control EINVAL 
oldaddr if_ioctl 
246-253 rtinit 
rtinit 
6.6.8 
6-22 SIOCSIFBRDADDR 
ioctl 
. in.c 
207 case SIOCSIFBRDADDR: 
208 if ((so->so state & SS PRIV) == 0) 
209 return (EPERM); 
210 /* FALLTHROUGH */ 
211 case SIOCGIFADDR: 
212 case SIOCGIFNETMASK: 
213 case SIOCGIFDSTADDR: 
214 case SIOCGIFBRDADDR: 
215 if (ia == (struct in_ifaddr *) 0) 
216 return (EADDRNOTAVAIL); 
217 break; I 
in.c 


DH 6-22 QQ incontrol 0000000 





138 
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TCP/IP 2 
207-217 SIOCSIFBRDADDR 
4|] SIOCGXXX ia 
(ia[] in control 6-13) ia EADDRNOTAVAIL 
5 (4[] get set ) 6-23 
in.c 
220 case SIOCGIFADDR: 
221 *((struct sockaddr_in *) &ifr->ifr_addr) = ia->ia_addr; 
222 break; 
223 case SIOCGIFBRDADDR: 
224 if ((ifp->if_flags & IFF BROADCAST) == 0) 
225 return (EINVAL); 
226 *((struct sockaddr in *) &ifr->ifr_dstaddr) = ia->ia broadaddr; 
227 break; 
228 case SIOCGIFDSTADDR: 
229 if ((ifp->if flags & IFF POINTOPOINT) == 0) 
230 return (EINVAL); 
231 *((struct sockaddr_in *) &ifr->ifr_dstaddr) = ia->ia_dstaddr; 
232 break; 
233 case SIOCGIFNETMASK: 
234 *((struct sockaddr in *) &ifr->ifr_addr) = ia->ia_sockmask; 
235 break; 
254 case SIOCSIFBRDADDR: 
255 if ((ifp->if_flags & IFF_BROADCAST) == 0) 
256 return (EINVAL); 
257 ia->ia broadaddr = *(struct sockaddr in *) &ifr->ifr broadaddr; 
258 break; 
me n; 
[] 6-23 QQ in control JOD 
220-235 ifreq 
254-258 ifreq 
6.6.9 [| IP] 
SIOCGxxx[] SIOCSxxx IP —— [| in control 
(0 6-25) IP 
SIOCAIFADDR SIOCAIFADDR SIOCGXXX 
SIOCSxxx ifconfig SIOCAIFADDR 
IP 
Net/3[] ifconfig alias in aliasreq 
6-24 
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; : in var.h 
59 struct in aliasreq ( 
60 char ifra name[IFNAMSIZ]; /* interface name, e.g. "en0" */ 
61 struct sockaddr in ifra addr; 
62 struct sockaddr in ifra broadaddr; 
63 #define ifra dstaddr ifra broadaddr 
64 struct sockaddr in ifra mask; 


65 }; . 
$$ in var.h 


06-24 DU in aliasreg 





























































































































































































































































































































































































































































































































































































































































































































59-65 ifreq in aliasreq 
ioctl SIOCAIFADDR 
SIOCAIFADDR SIOCDIFADDR 
IP in ifaddr 6-25 SIOCAIFADDR|| SIOCDIFADDR 
in control(l[] 6-13) i a 
ifra name( ) IP 
in.c 
154 case SIOCAIFADDR: 
155 case SIOCDIFADDR: 
156 if (ifra->ifra_addr.sin_family == AF_INET) 
157 for (oia = ia; ia; ia = ia->ia_next) { 
158 if (ia->ia_ifp == ifp && 
159 ia->ia addr.sin addr.s addr == 
160 ifra->ifra addr.sin addr.s addr) 
161 break; 
162 3 
163 if (cmd == SIOCDIFADDR && ia == 0) 
164 return (EADDRNOTAVAIL); 
165 /* FALLTHROUGH to Figure 6.14 */ 
























































































































































































































































































































































































































































































































































































































































































































































































































































































































































0 6-25 QQ in contra po000000 

154-165 SIOCDIFADDR *ifra 6-25 

SIOCAIFADDR([] ifra in aliasreg JH SIOCDIFADDR([] ifra 

ifreq ) in_aliasreqll ifreq 

in_control for ifra- 
>ifra_addr IP in_ifaddr 
EADDRNOTAVAIL 
6-14 
6-14 in aliasreq 
in ifaddr 

















































































































































































































































































































































































































6.6.10 IP SIOCAIFADDR 
ia in ifaddr IP 

in ifaddr SIOCAIFADDR| 6-26 

266-277 SIOCAIFADDR 

maskIsNew|| hostIsNew 
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TCP/IP 
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in.c 

266 case SIOCAIFADDR: 

267 maskIsNew = 0; 

268 hostIsNew = 1; 

269 error = 0; 

270 if (ia->ia_addr.sin_family == AF_INET) { 

271 if (ifra->ifra_addr.sin_len == 0) { 

272 ifra->ifra_addr = ia->ia_addr; 

273 hostIsNew = 0; 

274 } else if (ifra->ifra_addr.sin_addr.s_addr == 

275 ia->ia addr.sin addr.s addr) 

276 hostIsNew = 0; 

277 ) 

278 if (ifra->ifra mask.sin len) ( 

279 in ifscrub(ifp, ia); 

280 ia->ia sockmask = ifra->ifra mask; 

281 ia->ia subnetmask = 

282 ntohl (ia->ia_sockmask.sin_addr.s_addr); 

283 maskIsNew = 1; 

284 } 

285 if ((ifp->if_flags & IFF_POINTOPOINT) && 

286 (ifra->ifra_dstaddr.sin_family == AF INET)) { 

287 in ifscrub(ifp, ia); 

288 ia->ia dstaddr = ifra->ifra dstaddr; 

289 maskIsNew = 1; /* We lie; but the effect's the same */ 

290 ) 

291 if (ifra->ifra addr.sin family == AF INET && 

292 (hostIsNew || maskIsNew)) 

293 error = in ifinit(ifp, ia, &ifra->ifra addr, 0); 

294 if ((ifp->if flags & IFF BROADCAST) && 

295 (ifra->ifra broadaddr.sin family == AF INET)) 

296 ia->ia broadaddr = ifra->ifra broadaddr; 

297 return (error); A 
1n.c 

[]6-26 UU in control [| SIOCAIFADR TU 
IP (hostIsNew[] I ) 
O[] in control hostIsNew 0 0 
hostIsNew 0 
278-284 
in_control 
285-290 in_scrub 

























































































































































































in_ifinit 





















































maskIsNew 





































































































































































































































































































































































































































































































291-297 in_ifinit 
(U 6-17) in_ifinit 0 
in_aliasreq 
6.6.11 IP SIOCDIFADDR 
SIOCDIFADDR IP 6-27 ia 
in ifaddr ( ) 
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298 case SIOCDIFADDR: en 

299 in ifscrub(ifp, ia); 

300 if ((ifa = ifp->if addrlist) == (struct ifaddr *) ia) 

301 /* ia is the first address in the list */ 

302 ifp->if addrlist = ifa->ifa next; 

303 else ( 

304 /* ia is *not* the first address in the list */ 

305 while (ifa->ifa next && 

306 (ifa->ifa next != (struct ifaddr *) ia)) 

307 ifa = ifa->ifa next; 

308 if (ifa->ifa next) 

309 ifa->ifa next = ((struct ifaddr *) ia)->ifa next; 

310 else 

311 printf("Couldn't unlink inifaddr from ifp\n"); 

312 ) 

313 oia = ia; 

314 if (oia == (ia = in ifaddr)) 

315 in_ifaddr = ia->ia_next; 

316 else { 

317 while (ia->ia_next && (ia->ia_next != oia)) 

318 ia = ia->ia_next; 

319 if (ia->ia_next) 

320 ia->ia next = oia->ia_next; 

321 else 

322 printf("Didn’t unlink inifadr from list\n"); 

323 } 

324 IFAFREE ( (&oia->ia_ifa)); 

325 break; I 
nc 


0 6-27 in control [000000 




































































298-323 ia in ifscrub 






































































































































if if Internet 











































































































(in ifaddr) 
324-325 IFAFREE 0 


































































































































































































6.7 Dl ioct1[] [] 

































































ioctl 





















































































































































leioctl[|slioctl[| loioctl 
in ifinit 6-16 SIOCSIFADDR 6-26 SIOCAIFADDR 
in ifinit if ioctl SIOCSIFADDR (0 6-17) 












































































































































































































































6.7.1 leioctl 




































































































































































4-31 LANCE SIOCSIFFLAGS 6-28 
SIOCSIFADDR 
614-637 data ifaddr ifp->if_unit 



































































































































le_softc 









































































































































leinit Internet IP arpcom 
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ARP ARP[] 21.5 1[] 4.7 
627-677 EINVAL 
- - if le.c 

614 leioctl(ifp, cmd, data) 

615 struct ifnet *ifp; 

616 int cmd; 

617 caddr t data; 

618 ( f 

619 struct ifaddr *ifa = (struct ifaddr *) data; 

620 struct le_softc *le = &le_softc[ifp->if_unit]; 

621 struct leregl *lerl = le-»sc r1; 

622 int s = splimp(), error = 0; 

623 switch (cmd) { 

624 case SIOCSIFADDR: 

625 ifp->if_flags |= IFF UP; 

626 switch (ifa-»ifa addr->sa family) ( 

627 case AF INET: 

628 leinit(ifp->if unit): /* before arpwhohas */ 

629 ((struct arpcom *) ifp)-»ac ipaddr = 

630 IA SIN(ifa)-»sin addr; 

631 arpwhohas ( (struct arpcom *) ifp, &IA SIN(ifa)-»sin addr); 

632 break; 

633 default: 

634 leinit (ifp->if_unit); 

635 break; 

636 } 

637 break; 

u pues 1 m å = 

672 default: 

673 error = EINVAL; 

674 } 

675 splx(s); 

676 return (error); 

677 } 
if_le.c 

O 6-28 [ [| leioctl 
6.7.2 slioctl 
slioctl([] 6-29)[] SLIP SIOCSIFADDR|| SIOCSIFDSTADDR 

if sl.c 





653 int 
654 slioctl(ifp, cmd, data) 
655 struct ifnet *ifp; 


656 int cmd; 

657 caddr t data; 

658 { 

659 struct ifaddr *ifa = (struct ifaddr *) data; 
660 struct ifreq *ifr; 

661 int s = splimp(), error = 0; 

662 switch (cmd) ( 


06-29 UU slioctid [] O [| SIOCSIFADDR [| SIOCSIFDSTADDR 
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663 case SIOCSIFADDR: 

664 if (ifa->ifa_addr->sa_family == AF_INET) 
665 ifp->if_flags |- IFF UP; 

666 else 

667 error = EAFNOSUPPORT; 

668 break; 

669 case SIOCSIFDSTADDR: 

670 if (ifa->ifa_addr->sa_family != AF_INET) 
671 error = EAFNOSUPPORT; 

672 break; 























































































































































































































































































































































































































688 default: 
689 error = EINVAL; 
690 } 
691 splx(s); 
692 return (error); : 
693 } S 
if sl.c 
[] 6-29 (0) 
663-672 IP EAFNOSUPPORT 
SIOCSIFADDR IFF UP 
688-693 EINVAL 
6.7.3 loioctl 
loioctl SIOCSIFADDR 6-30 
135 int ifloop.c 
136 loioctl(ifp, cmd, data) 
137 struct ifnet *ifp; 
138 int cmd; 
139 caddr_t data; 
140 { 
141 struct ifaddr Fifa; 
142 struct ifreq *ifr; 
143 int error = 0; 
144 switch (cmd) { 
145 case SIOCSIFADDR: 
146 ifp->if flags |= IFF UP; 
147 ifa = (struct ifaddr *) data; 
148 /* 
149 * Everything else is done at a higher level. 
150 e 
151 break; 


















































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































O 6-30 [ [| loioct1 [ O [| SIOCSIFADDR 
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167 default: 
168 error = EINVAL; 
169 } 
170 return (error); 
171 } 
if_loop.c 
[ 6-30 (0) 
135-151 Internet loioctl IFF UP L 
167-171 EINVAL 
LU U U U U U | 00000000 (rr op 
6.8 Internet] 11 [| 
6-31[] U U Internet [] 6-5] ifnet 
O O 32 bit IPH E] E] E] E] E] E]. E] 0 0 0 0 0 0 0 0 
netinet/in.c[][] 0 Ul 
[] U U U 
in netof in] 00000000000000000 0000D000000D0000 




















00000000 

u_long in_netof (struct in_addr in); 

OOO m) 160 D D 0.0 D D D.D D D D D DU D 50 D 0000000000 
000000000090 

int in canforward(struct in_addr in); 

in_localaddr D 0 0 0 o D D DD DDD DD 00000 D D D D D D DU Osubnetsarelocal 
00 000000000000000000000 

int in localaddr(struct in addr in); 

in broadcast 002 D D D œD D 0 0 0 D 0 0 0 D 0000000 0 


int in_broadcast (struct in_addm, struct ifnetifp); 





in_canforward 












































[] 6-31 Internet] O DD 






































































































































































































































































































































Net/2[] in canforward | | 0 
Net/2 | 127.0.0.1[] Net/2 | 
( 127.0.0.2)[] 
127.0.0.2[] telnet[] [] ¢ 6.6) 








































































































6.9 ifnet | O00 


































































































































































































































































































































































































U U U U 6-5 | 0 O 6-32 U U 
0 sockaddr[] |] 0 g [| 6-31 
0 0 32 bit[] IP O 0 DI 
net/if.c 
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0 HU D B 
ifa ifwithaddr 0ifnoet0 00000000000000 add D 0 0 D D D D 000 D 


000 ifaaar D 0 DD D DD 00000 000000000 
struct ifaddr ifa ifwithaddr(struct sockaddradir); 
ifa ifwithdstaddr DifnetUDDOUDDODUD aaa 000000000000000 
ifaddr J0O0000000000000000000 
struct ifaddr *ifa ifwithdstaddr(struct sockaddr atldr); 
ifa ifwithnet Difnet 00000 add H H 0 0 H H H U 0 åfader IO OD 
O00000000000000000 
struct ifaddr ifa_ifwithnet (struct sockaddraddr); 
ifa ifwithaf D ifnet([NNO0004ddQ0000000000000000000 
ifaddecJOOO0000000000000000000 
struct ifaddr ifa ifwithaf(struct sockaddradür); 
ifaof ifpforaddr DU pD D D D D D «aa D 0000000 0000000000000 
O0000000000000000000000000000000 
000000 ifaderQOOO0000000000000000000 
structifaddr * ifaof ifpforaddstruct sockaddr *addr, 
struct ifnet if); 


ifa_ifwithroute 000000 Gog D D DUDU (gateway O0 0000000000 ifadar[] 
0000 


struct faddr ifa ifwithroute(intflags, struct 





























U 
00 








sockaddr dst, struct sockaddrgateway); 


ifunit O00 name] 00 ifnetJ 0000 


struct ifnet Afunit(char Rame); 


O 6-32 ifnet ID D] Ü] 




















0000000000 PO D 0 0 D 0 0 D D PODO DO D 0 0 D 0 DD 00000 






















































































































































































































































































































































































































































































OD in ifaddr[] sockaddr_in 
00000000000 ifconfigf ioct1 0000000090 IPOD! 
i U IP 
U U 
61 0000000000 sockaddr ini) [] sin_addr[] D [] [] [] BEBE 
6.2 ifunit("sl0")[][][] D] D] D] D] 6-50 000000 
63 U IPD DD DDD UD 0 UD D U D UD U DUD UD ifaderd D 0 0 D U D D 0 U 
ac ipaddr 000 
64 O00000 IP DD 0 D D 0 0 D UDP D 0 D UD 0 D 0 0 U IP D 0 0 D 0 
65 JÜ ] in_socktrim| JO sin len] B B U HH EH] E] E] U U ED] E] HE E] T) 
sockaddr_in 0000000 
66 JO ON telnet127.0.0 PI 0000 0000000 Ne/2000000090 
OOOOO0000000000000000000000000000000 
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741 LI 
o [] | EL E] o Net/3 | [] Internet L 
[ | | i 0 IP i 
IP 8 
Net/3 | Net/3 
3-19 
7-1 
u a 0 00 0 [] U 
PF INET AF INET Internet 
PFP OSI, PF ISO AF OSI, AF ISO OSI 
PF LOCAL, PF UNIX AF LOCAL, AF UNIX D] DÚ IPC(Unix) 
PF ROUTE AF ROUTE uat 
n/a AF LINK 000 (00000) 
11 HBULBHEHEHBHBEHBHBHH 
PF LOCAL|| AF LOCAL 
POSIX.12 Net/3 PF UNIX[] AF. UNIX[I |] 
Net/3[] [] UNIX o 
PF_UNIX Unix [Stevens 1990] 
PF_ROUTE U U U | O G 180 2L] utl PF OSI 
Net/3 OSI[] 0000000090 
PF INET 
7.2 [JD] Li 
U C 7-2 4 
U [] [] [] 
netinet/domain.h domain] 000 
netinet/protosw.h protosw Ú 00 
netinet/in_proto.c IP domain[] protoswl] ] 
kern/uipc domain.c | 00000000 

















072 2000009900 
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7.2.1 
7-3 L | IO LU | | Net/3 
L 
0 0 u DD 0 0 U 
domain struct domain * 00000 
inetdomain struct domain Internet] [] [| domain] O 
inetsw struct protosw[] Internet] [| [] protosw] H DU Ü 
max_linkhdr int OO 7-17 
max protohdr int OO 7-17 
max hdr int OO 7-17 
max datalen int OD 7-17 
173 00000000000 
7.2.2 uu 
7-4 ip init 
[] Ë D D 0 D [] U 
ip_ifmatrix int[I[ OOO00000000000000000000 












































HT (1000000000 


7.3 domain] |] 

























































































0 | 7-50 U O domain 1000 
: domain.h 

42 struct domain ( 
43 int dom family; /* AF xxx */ 
44 char *dom name; 
45 void (*dom init) /* initialize domain data structures */ 
46 (void); 
47 int (*dom externalize) /* externalize access rights */ 
48 (struct mbuf *); 
49 int (*dom dispose) /* dispose of internalized rights */ 
50 (struct mbuf *); 
51 struct protosw *dom protosw, *dom protoswNPROTOSW; 
52 struct domain *dom next; 
53 int (*dom rtattach) /* initialize routing table */ 
54 (void **, int); 
55 int dom rtoffset; /* an arg to rtattach, in bits */ 
56 int dom maxrtkey; /* for routing layer */ 


57}; . 
—_—_—_o eo _— _ —_ _— POE A 


0 7-5 [D D demain OOO 


























































































































42-57 dom family ( AF INET) | 0 









































“ 








internet” ) 







































































| dom name|| [| ( 
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TCP/IP 2 
fstat (1) dom_name dom_name 
Net/3 
dom_init dom_externalize|| dom dispose 
Unix 

Internet 
dom protoswl| dom protoswNPROTOSW protosw 
dom next 
































domains 



































dom rtattach 























dom rtoffset||dom maxrtkey 




























































































7-6 






























































domains 














domains: 





isodomain: 


inetdomain: 








routedomain: 





[] 7-6 domains [] [] 


7.4 protoswl] [|] 


unixdomain: 















































































































































































































































































































































































































































































































































Net/3 protosw 
domain protosw 
protosw Protosw 7-7 
57 struct protosw { protosw.h 
58 short pr type; /* see (Figure 7.8) */ 
59 struct domain *pr domain; /* domain protocol a member of */ 
60 short pr protocol; /* protocol number */ 
61 short pr flags; /* see Figure 7.9 */ 
62 /* protocol-protocol hooks */ 
63 void (*pr_input) (); /* input to protocol (from below) */ 
64 int (*pr_output) (); /* output to protocol (from above) */ 
65 void (*pr ctlinput) (); /* control input (from below) */ 
66 int (*pr ctloutput) (); /* control output (from above) */ 
67 /* user-protocol hook */ 
68 int (*pr usrreg) (); /* user request from process */ 
69 /* utility hooks */ 
70 void (*pr init) (); /* initialization hook */ 
71 void (*pr_fasttimo) (); /* fast timeout (200ms) */ 
72 void (*pr slowtimo) (); /* slow timeout (500ms) */ 
73 void (*pr drain) (7; /* flush any excess space possible */ 
74 int (*pr sysctl) (); /* sysctl for protocol */ 


75 ); 


TI — — protosw.h 


U 7-7 pro 


tosw 00000 











57-61 









































































































































pr type 









































7-8 
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pr_type | Internet| 
pr_type DO OO Internet] [] 
SOCK_STREAM 020000000090 TCP 
SOCK_DGRAM 000000000090 UDP 
SOCK_RAW 000000000090 ICMP] IGMP) [] [ IP 
SOCK RDM 00000000 (000) n/a 
SOCK SEOPACKET O0OO0000000 n/a 
0 7-8 pr type D U 00000 
pr domain domain pr protocol | pr flags 
7-9 pr flags 
pr flags O [] 
PR ATOMIC OO00000000000000000 
PR ADDR OO0000000000000 
PR CONNREQUIRED 4000000 
PR_WANTRCVD O00000000000000 
PR RIGHTS 00000000 
O0 7-9 pr flags [| [J 
| | PR ADDR | U PR ATOMIC[] PR ADDR[] 
PR CONNREQUIRED|! Li 
[] PR WANTRCVD | [] [] o 
( ) 
PR RIGHTS 
| | | U Unix[] 
7-10 O | O | | | | | | 




























































































pr type 


SOCK STREAM 


SOCK SEOPACKET 


SOCK RDM 


SOCK DGRAM 


SOCK RAW 




















PR 





































































































07-10 4000000 































































































































































































7-10 PR_WANTRCVDL| PR RIGHTS 
PR WANTRCVD 
| Net/3 O protosw utut lU PRxxx[] l] U 
pr_typel] | 7-100 OG ICH OI OT DDD" MOOD pr type 








































































































150 
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inetsw 

















protosw 


domain 














protosw 


TCP/IP 2 
7-100 
. TCP[] SPP([] O XNS ) SOCK STREAM 
E | (UU SOCK_SEOPACKET ut 
PR ATOMIC uu uu O 0 i 
MSG EOR 
SPP[] [| LI LI SOCK_STREAM|| SOCK SEQPACKET 
. SOCK RDM RDP 
RDP[] [Partridge 1987] RFC 115 
[Partridge and Hinden 1990] 
| 7-10 
. uuu UDP) i | SOCK_DGRAM]] [J 
. ICMP SOCK_RAW|] [J Net/3[] 
SOCK_RAW (O 15-8) 

62-68 5 pr_input 
pr_output pr_ctlinput 
pr_ctloutput | pr usrreqi] |] 

III 7-11 
pr usrreq 
TARSAR (0 D D read, write,D D) 
I 
I 
pr_output pr_ctloutput 
GOOOO0O0O00) UODOODUD) 
pr_input pr_ctlinput 
(0000 Tero dO) (IU D ICMP[I D) 
07-11 QOO00 5000000 

69-75 5 pr_init [| pr fasttimo 

pr slowtimo 200 ms[] 500 ms 

pr drain m reclaim ({] 2-13) 

pr sysctl[]| sysct1(8) 

UDP 
7.5 IP] domain[] protosw[] [] 














Internet 






























































| U 7-12 























7-13 







































































| inetsw 
































Internet domain 

inetsw[] pr_protocol pr_type O U U O 
0 0 0 Internet[] [] IP 
1 IPPROTO_UDP SOCK_DGRAM 0000000 UDP 
2 IPPROTO_TCP SOCK_STREAM 000000 TCP 
3 IPPROTO RAW SOCK RAW Internet] D ( O ) IPOD) 
4 IPPROTO ICMP SOCK RAW Internet] 00000 ICMP 
5 IPPROTO IGMP SOCK RAW Internet] DUU D IGMP 
6 0 SOCK_RAW Internet] 00000) POOD) 



















































































































































































[] 7-12 Internet] DD 
in_proto.c 


39 struct protosw inetsw[] = 


40 
41 


{ 


}; 


10, &inetdomain, 0, 0, 

0, ip_output, 0, 0, 

0, 

ip_init, 0, ip_slowtimo, ip drain, ip sysctl 

}, 

{SOCK_DGRAM, &inetdomain, IPPROTO_UDP, PR_ATOMIC | PR_ADDR, 
udp_input, 0, udp_ctlinput, ip_ctloutput, 

udp_usrreq, 

udp_init, 0, 0, 0, udp_sysctl 

}, 

{SOCK_STREAM, &inetdomain, IPPROTO_TCP, PR_CONNREQUIRED | PR_WANTRCVD, 
tep input, 0, tep_ctlinput, tep ctloutput, 

tcp usrreq, 

tcp init, tcp fasttimo, tcp slowtimo, tcp drain, 

F; 

(SOCK RAW, &inetdomain, IPPROTO RAW, PR ATOMIC | PR_ADDR, 
rip_input, rip_output, 0, rip_ctloutput, 

rip_usrreq, 

0, 0, 0, O, 

}, 

{SOCK_RAW, &inetdomain, IPPROTO_ICMP, PR_ATOMIC | PR_ADDR, 
icmp_input, rip_output, 0, rip_ctloutput, 

rip_usrreq, 

0, 0, 0, 0, icmp_sysctl 

}, 

{SOCK_RAW, &inetdomain, IPPROTO_IGMP, PR_ATOMIC | PR_ADDR, 
igmp_input, rip_output, 0, rip_ctloutput, 

rip_usrreg, 

igmp_init, igmp_fasttimo, 0, 0, 

}, 
/* raw wildcard */ 

{SOCK_RAW, &inetdomain, 0, PR_ATOMIC | PR_ADDR, 
rip_input, rip_output, 0, rip_ctloutput, 

rip_usrreq, 

rip init, 0, 0, 0, 

}, 


struct domain inetdomain = 
{AF_INET, "internet", 0, 0, 0, 
inetsw, &inetsw[sizeof(inetsw) / sizeof(inetsw[0])], 0, 


rn_inithead, 32, sizeof(struct sockaddr_in)}; : 
——— HL proto.c 


O 7-13 Internet [] domain |] protosw [] JJ 


152 
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TCP/IP[] | [] 2 
39-77 [| inetsw] [| UU 30 protoswl] | EL E] IPLE] FH] LH] UDE inetsw[0][] U 
O IPUULUI H HE | | L inetsw[3][] inetsw[6]| U 
pr protocol IP[] 0000 inetsw[310 0 
i UDO DO inecsw[6] 000 i HI 0000 i i 
pffindproto|] |] (7.6[] )[] 
[] Net/3 | | inetsw[310 U 0 0 IP E o 
E | OOO inetsw[610 UU [ IP O [| 4.3BSD Reno 
IP HDRINCL (32.80 )| [| inetsw[3][] inetsw[6] |] [] U 
i LU [ [ OOO0000000 POOO U U i D 
OM DUI 0000000090 OM OM OM OM OM 
U uu U JOD traceroutel] [] IP U 
IP] [] 32 | U IP | 7-14 IP protoswl] |] 
protosw inetsw[0] inetsw[3[] 6] O O 
pr_type 0 SOCK_RAW rPrp0000000 
pr_domain &inetdomain &inetdomain 00000 Internet[] 0000 
pr_protocol 0 IPPROTO RAM] O IPPROTO RAW(255)[ 00 0 
D D D (RFC 17000 00000 
OOPOOOOOD 
pr flags 0 PR_ATOMIC/PR_ADDR BH retta 
pr input null rip input N IPO ICMP[] IOMP OOD 
pr output ip output rip output 0000000000 PO 
pr ctlinput null null IPT 0 O 
pr_ctloutput null rip_ctloutput 000000000090 
pr usrreq null rip usrreg 0000000000 
pr_init ip_init null] rip init ip init] 000000 
pr fasttimo null null IPT O O 
pr_slowtimo ip_slowtimo null lg ied pg dgautututü 
pr drain ip drain null 0200000000 
pr_sysctl ip sysctl null U U 0 D 00 
O 7-14 IP inetsv HUDD 
78-81 Internet|] [] [| domain | D 7-130 0 | Internet[] AF INET L 
[] " internet" uut | uut O protoswl] inetswl[] D 
Internet [] rn_initheadl IP | 32 
O LH [] Internet sockaddr inl] |] (16 ) 
inetsw[3][| inetsw[6] | pr protocol[l |] Í | | 
rip init[] || inetsw[6] HT l T 7 | 
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domaininit 


































































































({] 3-23) domaininit domain[] protosw 


































































































domaininit 7-15 





° er S EAT uipc domain.c 
37 /* simplifies code in domaininit */ 


38 #define ADDDOMAIN (x) TV 

39 extern struct domain __CONCAT (x,domain); \ 
40 — CONCAT (x, domai n. dom next) = domains; \ 

41 domains = & CONCAT(K,domainj; \ 

42 ) 

43 domaininit () 

44 I 

45 struct domain *dp; 

46 struct protosw *pr; 

47 /* The C compiler usually defines unix. We don't want to get 
48 * confused with the unix argument to ADDDOMAIN 
49 */ 

50 #undef unix 

51 ADDDOMAIN (unix); 

52 ADDDOMAIN (route); 

53 ADDDOMAIN (inet); 

54 ADDDOMAIN (iso); 

55 for (dp = domains; dp; dp = dp->dom_next) { 
56 if (dp->dom_init) 

57 (*dp->dom_init) (); 

58 for (pr = dp->dom_protosw; pr < dp->dom_protoswNPROTOSW; pr++) 
59 if (pr->pr_init) 

60 (*pr->pr_init) (); 

61 } 

62 if (max_linkhdr < 16) /* XXX */ 

63 max linkhdr = 16; 

64 max hdr = max linkhdr + max protohdr; 

65 max datalen = MHLEN - max hdr; 

66 timeout (pffasttimo, (void *) 0, 1); 

67 timeout (pfslowtimo, (void *) 0, 1); 

68 ) 


—— TO gipc_domain.c 


07-15 [| [| domaininit 










































































































































































37-42 ADDDOMAIN domain ADDDOMAIN(unix) 
extern struct domain unixdomain; 
unixdomain.dom_next = domains; 
domains = &unixdomain; 
_CONCAT sys/defs.h CONCAT 























(unix, domai)h unixdomain 
























































































































































































































































43-54 domaininit ADDDOMAIN 
unix C | Net/3 
ADDDOMAIN 

































































154 





TCP/IP 
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7-16 






























































OSI 



































domains: 


isodomain: 


inetdomain: 





domain 











Unix 








Internet 
















































































protosw 











routedomain: unixdomain: 











































































































































































































































































































































































































































































































































































































































































































































































































07-16 D UO UD D. demain [I] [| [| protosw J [J 
55-61 for 
dom init[]pr init Internet (U 7-13) 
ip init|| udp init|| tcp nit igmp init|| rip init 
62-65 domaininit mbu 
max linkhdr[| max protohdr domaininit 
max linkhdr 16[] 16 4 14 
7-17 7-18 
0 U [ 0 U 
max linkhdr 16 000000000000 
max_protohdr 40 O00000000000000 
max hdr 56 max linkhdr + max protohdr 
maz datalen 44 O0000000000000000 mf] 00000000 
0717 O0O00000000000 
ha max hari 0 — 
m har[] 0000 ` 
WWE iu fom > 
280 0 160 0 400 D 440 D 


MHLEN max_linkhdr max_protohdr 
ju 128[] 0 


m 


ax_protohdr 


O 7-18 mbuf[] 


max datalen 


UDUDUDUDU 














IP 











Internet 










































































TCP 


20 






































max_protohdr 
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66-68  domaininit timeout pfslowtimol| pffasttimo 3 
1 7-19 













































































































































































































































































uipc_domain.c 
153 void pe- 


154 pfslowtimo (arg) 
155 void *arg; 


156 ( 

157 struct domain *dp; 

158 struct protosw *pr; 

159 for (dp = domains; dp; dp = dp->dom next) 

160 for (pr = dp->dom protosw; pr < dp->dom_protoswNPROTOSW; pr++) 
161 if (pr->pr_slowtimo) 

162 (*pr->pr_slowtimo) (); 

163 timeout (pfslowtimo, (void *) 0, hz / 2); 

164 } 

165 void 


166 pffasttimo (arg) 
167 void *arg; 


168 ( 

169 struct domain *dp; 

170 struct protosw *pr; 

171 for (dp = domains; dp; dp = dp->dom_next) 

172 for (pr = dp->dom_protosw; pr < dp->dom_protoswNPROTOSW; pr++) 
173 if (pr->pr_fasttimo) 

174 (*pr->pr_fasttimo) (); 

175 timeout (pffasttimo, (void *) 0, hz / 5); 

176 ) 


RT pc domain.c 


U 7-19 [][] pfslowtimo [| pffasttimo 





















































































































































































































































153-176 for pr slowtimo 
pr fasttimo 500 ms[] 200 ms 
timeout timeout 3-43 


































































































7.6 pffindproto[] pffindtypel] |] 































































































































































































































































































































































































































































































































































































































































































































































































7-20 pffindproto|| pffindtype ( IPPROTO_TCP) 
( SOCK_STREAM) 15 
protosw 
69-84 pffindtype domains 
85-107 pffindprotol| pffindtype domains 
pffindproto (protocol[] type) 
type[] SOCK RAW (pr. protocol 0) 
pffindproto 
pffindproto(PF INET, 27, SOCK RAW); 
inetsw[6] IP Net/3 27 















































































































































































































































IP IP 27 





























































































































1 56 TCP/IP 2 
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27 (RFC 1151) 








































































































































































































protosw 




























































































uipc_domain.c 


struct protosw * 
pffindtype (family, type) 
int family, type; 


{ 


} 


struct domain *dp; 
struct protosw *pr; 


for (dp = domains; dp; dp = dp->dom_next) 
if (dp->dom_family == family) 
goto found; 
return (0); 
found: 
for (pr = dp->dom_protosw; pr < dp->dom_protoswNPROTOSW; pr++) 
if (pr->pr_type && pr->pr_type == type) 
return (pr); 
return (0); 


struct protosw * 



























































































































































86 pffindproto (family, protocol, type) 

87 int family, protocol, type; 

88 ( 

89 struct domain *dp; 

90 struct protosw *pr; 

91 struct protosw *maybe = 0; 

92 if (family == 0) 

93 return (0); 

94 for (dp = domains; dp; dp = dp->dom next) 

95 if (dp->dom_family == family) 

96 goto found; 

97 return (0); 

98 found: 

99 for (pr = dp->dom_protosw; pr < dp->dom protoswNPROTOSW; pr++) ( 
100 if ((pr->pr_protocol == protocol) && (pr->pr_type == type)) 
101 return (pr); 

102 if (type == SOCK_RAW && pr->pr_type == SOCK_RAW && 
103 pr->pr_protocol == 0 && maybe == (struct protosw *) 0) 
104 maybe = pr; 
105 } 
106 return (maybe); 
107 } 
uipc_domain.c 
I 7-20 [| [| pffindproto [| pffindtype 
15.6 
socket (PF INET, SOCK STREAM, 0); /* Ter OQ */ 


pffindtype 
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pffindtype (PF_INET, SOCK STREAM); 














| TCP 











































































































7-12 
SOCK STREAM 
socket (PF INET, SOCK DGRAM, 0); /* ver [][] */ 


pffindtypell | inetsw[2] 



















































































pffindtype (PF_INET, SOCK DGRAM); 



































inetsw[1][] UDP 
























































7.7 pfctlinput|]| | 






































































































































pfctlinput (U 7-21) 






































ICMP 
ICMP pfctlinput ([] 11-14) Internet ( 






































































































































































































































































































































UDP[] TCP) 











142 pfctlinput (cmd, sa) uipc_domain.c 








































































































































































































































































































































































































































































































































































































143 int cmd; 

144 struct sockaddr *sa; 

145 { 

146 struct domain *dp; Ñ 

147 struct protosw *pr; 

148 for (dp = domains; dp; dp = dp->dom_next) 

149 for (pr = dp->dom_protosw; pr < dp->dom_protoswNPROTOSW; pr++) 

150 if (pr->pr_ctlinput) 

151 (*pr->pr_ctlinput) (cmd, sa, (caddr t) 0); 

152 } p 

uipc_domain.c 
07-21 00 pfetlinput 

142-152 for pfctlinput 

pr ctlinput cmd UDP 
udp ctlinput TCP tcp ctlinput 
fo Poog 

7-13 Internet Internet 
IP ip_init 23 24 UDP[] TCP 
ip_protox 





































































































7.8.1 Internet u O 





































































































































































































































































































































































































































































































































































































U U IP | U U UI U U 
protosw Internet 
ip_protox 7-22 
ip_protox IP (ip_p 8-8) inetsw 
6 inetsw[2] 
TCP ip_protox 7-23 





















































































































































158 TCP/IP 2 Chibasbub.toM 
— a 


inetsw[]: 
IP 





07-22 []D ipprotox 0000000000 inetsw [000 









































































































































































































































































































































































































































































































































































































































































































































































































































































































































ip input.c 
71 void p_mpu 
72 ip_init() 
73 I 
74 struct protosw *pr; 
75 int i: 
76 pr = pffindproto(PF INET, IPPROTO RAW, SOCK RAW); 
77 if (pr == 0) 
78 panic("ip_init"); 
79 for (i = 0; i < IPPROTO MAY; i++) 
80 ip protox[i] = pr - inetsw; 
81 for (pr = inetdomain.dom_protosw; 
82 pr < inetdomain.dom_protoswNPROTOSW; pr++) 
83 if (pr->pr_domain->dom_family == PF_INET && 
84 pr->pr_protocol && pr->pr_protocol != IPPROTO_RAW) 
85 ip_protox[pr->pr_protocol] = pr - inetsw; 
86 ipq.next = ipq.prev = kipa; 
87 ip id = time.tv sec & Oxffff; 
88 ipintrq.ifq maxlen = ipqmaxlen; 
89 i = (if_index + 1) * (if_index + 1) * sizeof(u_long); 
90 ip ifmatrix = (u long *) malloc(i, M RTABLE, M WAITOK); 
91 bzero((char *) ip ifmatrix, i); 
92 T "m 
tp input.c 
1723 lH 
78.2 ip_init 
domaininit ([] 7-15) ip_init 
71-78 pffindproto (inetsw[3] 7-14) 
Net/3 panic 
IP 
79-85 ip_protox pr 
(O 7-22 3) inetsw ( 0 
IPPROTO RAW ) ip_protox inetsw 
protosw pr_protocol 

























































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































86-92 ip init[][][] IP ipq(10.6[] ) ip. id[][] U IP 
(ipintrg [| 50(ipqmaxlen)[] ip id | | 
uuu (10.6[] ) [] ip init ip ifmatrix[] 0 
i 0 
Net/3 0 L LU LU 
H H H gag IFQ MAXLEN) O 
(ipqmaxlen) 0 | adb[] 
O U ipqmaxlen 7-23 IFQ MAXLEN 0 
7.9 syscti|J [| [| 
sysctl Net/3 sysct1(8) 
| 
int sysctl(int * name, u int namelen, void *old, size t * oldlenp, void *new, size t newlen); 
*name namelen *old *new|] 
7-24] 0 0 0 0 
CTL_KERN 7 
CTL_USER 
CTL_NET 
PF_INET 
PF_OSI NS 
.0 
IPPROTO IGMP ‘°° 
IPCTL FORWARDING IPCTL DEFTTL 
IPCTL SENDREDIRECTS 
O 7-24 sysctl 00 J Ú) 
7-24 IP[] OO I 






























































CTL_NET{] PF INEJ[J ol IPCTL FORWARDING 
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net_sysctl 

















































































































sysctl 7-25 Internet 















































































































pr.sysctl 


Lä syscti : ICMPCTL_MASKREPL 


UDPCTL_CHECKSUM 


IPCTL_FORWARDING 


IPCTL_SENDREDIRECTS : 
IPCTL_DEFTTL 































































































































































































































































































































































































































































































































































































































































































07-25 DO Internet [| [| O sysctl OG 
sysctl net sysctl 
protosw pr sysctl 
sysctl sysctl sysctl 
sysctl sysctl switch 
switch net sysctl 
7-26 net_sysctl 
uipc_domain.c 
108 net sysctl (name, namelen, oldp, oldlenp, newp, newlen, p) 
109 int name; 
110 u_int namelen; 
111 void *oldp; 
112 size_t *oldlenp; 
113 void *newp; 
114 size_t newlen; 
115 struct proc *p; 
116 { 
117 struct domain *dp; 
118 struct protosw *pr; 
119 int family, protocol; 
120 ja 
121 * All sysctl names at this level are nonterminal; 
122 * next two components are protocol family and protocol number, 
123 * then at least one additional component. 
124 */ 
125 if (namelen < 3) 
126 return (EISDIR); /* overloaded */ 
127 family = name[0]; 
128 protocol = name[1]; 
129 if (family == 0) 


07-26 [][] net sysctl 
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130 return (0); 
131 for (dp = domains; dp; dp = dp->dom_next) 
132 if (dp->dom_family == family) 
133 goto found; 
134 return (ENOPROTOOPT); 
135 found: 
136 for (pr = dp->dom_protosw; pr < dp->dom protoswNPROTOSW; pr++) 
137 if (pr->pr protocol == protocol && pr->pr_sysctl) 
138 return ((*pr->pr_sysctl) (name + 2, namelen - 2, 
139 oldp, oldlenp, newp, newlen)); 
140 return (ENOPROTOOPT); 
141 ) S ` 
uipc domain.c 
1 7-26 (0) 
108-119 net_sysctl p sysctl p 
120-134 domain protosw 
0 for 
ENOPROTOOPT 
135-141 for pr_sysctl 
pr_sysctl (name+2) 
ENOPROTOOPT 
7-27 Internet pr sysctl 
pr protocol inetsw[] pr sysctl O O O O 
0 0 ip_sysctl IP 8.90 
IPPROTO UDP 1 udp_sysctl UDP 23.119 
IPPROTO_ICMP 4 icmp_sysctl ICMP 11.14] 

















DH 7-27 Internet] [] O O pr sysett [I [|] 














































































































































































































































































































































































































































































































































































































































































































































































































pr sysctl sysctl rtable [] 190 
710 00 
domain|] protosw Net/3 
protosw inetdomain 
inetsw Internet IP inetsw 
IP IP 
domainintl] domains 
| 
pffindprotoll pffindtype 












































































































































pfctlinput 














































































































































































































IP ip protox 











U U 


7.1 pfsfindprotol] |] inetsw[6]| U 


































































































U 80 


IPO D OO U 























































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































8.1 DD 
IP IP 
IP IP 1 30 90 12 RFC 791 [Postel 198 lal [] IP 
RFC 1122 [Braden 19894] RFC 791 
9 10 8-1 IP 
Jr 
—— DÉI 
fpina: | 
Og 
[] 8-1 IPD 1 D D 
4 IP IP ipintrg 
ipintr ipintrq 
IP 1 
IP ip forward ip forward 
ip output ip output IP 
IP 
ICMP( 11] ) Net/3 icmp_error ICMP icmp 
error mbuf| 

























































































































































































































































































Chi DIE) 





U 8] IP|] U 163 









































0000 IPU D D 0 0 ICMPU 0000 


















































U U ICMpD D U D D 0 0 000 








































































































































































































































































































































































































11| 
82 [nul 
000000000000 00000 8-2000 
0 E U [] 
net/route.h uu 
netinet/ip.h IP D D U 
netinet/ip  input.c IP OOD 
netinet/ip_ output .|cIP[] 0 Ü 
netinet/ip_ cksum.c| Internet] 0000 
082 GOU0000 
8.2.1 000 
U LIP) 0 D 0 0 0 D 0 0 DU U 0 DU UD 8-30 
0 E U DD 0 [] U 
in ifaddr struct in ifaddr F IPT [ll 
ip defttl int IP] D D D D TTL 
ip id int DU D D DD (pp D D 0 0 D ID 
ip_protox int[] IPD D D 0 0 0 0 
ipforwarding int D 0 D DDD ooo 
ipforward rt struct route OOO0000000000 
ipintrq struct ifqueue IPD D 0 Ú 
ipqmaxlen int IPD 0 D D 0 D D 0 0 
ipsendredirects int D D 0 D 0 D ICMPI og? 
ipstat struct ipstat IPO O 
Aaaa aa 3 TD 0 
822 HU 
IP 0 [] 8-4 ipstat[][] [] 8-5| | U netstat-s[] 
| | 0 LU 300 00 i 
ipstat[] J [] [] SNMPJ D 0 
ips_badhlen IPD D D D D 000 D 0 
ips_badlen IPD D 0 IPD D D D D D D DDD D 
ips_badoptions O0000000000000 
ips badsum O00000000 
ips badvers IPD D D D 40 0 0 D 
ips cant forward 000000000090 
ips delivered O000000000 
HS DBBHBDD 























164 


TCP/IP 
































China-pubecom 











0 


ipstat[] 


ips forward 

ips fragdropped 
ips fragments 
ips fragtimeout 


ips noproto 


ips reassembled 


lps tooshort 


te EE EE E EE ER 


lav) 
ET m] 
EVER 


ips toosmall 


ips total 


SNMP DD 








ips_cantfrag 


ips_fragmented 





OO) 
OOO 


ips_localout 














ips_noroute 














ips_odropped 





ips_ofragments 




















ips_rawout 






























































Ooooono EI E) 
CIE) E3 E3 EI EI EI E) 
E3 EJ E3 E3 EJ E3 on 
CU Ed E3 E3 EJ EI on 
CDI E3 E3 EJ E3 E3 E3 
GEA E rtr E E 





ips, redirectsent 

















netstat -s [| [0 


27,881,978 total packets received 
6 bad header checksums 

9 with size smaller than minimum 
14 with data size < data length 

0 with header length < data size 
0 with data length < header length 
0 with bad options 

0 with incorrect version number 
72,786 fragments received 






























ips total 
ips_badsum 
ips_tooshort 
ips_toosmall 
ips_badhlen 
ips_badlen 


 ips badoptions 


ips, badvers 


ips, fragments 






























0 redirects sent 


29,447,726 packets sent from this host 
769 packets sent with fabricated ip header 

0 output packets dropped due to no bufs, etc. 
0 output packets discarded due to no route 
260,484 output datagrams fragmented 
796,084 fragments created 

0 datagrams that can't be fragmented 





0 fragments dropped (dup or out of space) 
349 fragments dropped after timeout 
16,557 packets reassembled ok 

27,390,665 packets for this host 

330,882 packets for unknown/unsupported protocol 
97,939 packets forwarded 
6,228 packets not forwardable 


















ips, cantfrag 


ips fragdropped 
ips fragtimeout 
ips, reassembled 
ips delivered 

ips. noproto 
















ips forward 
ips, cantforward 
ips redirectsent 
ips localout 
ips rawout 
ips odropped 
ips, noroute 

ips fragmented ' 
ips ofragments 




























































































ICMP 




























































































































































































08-5 PHT Hu 
ips_noproto 
32.5 
8.2.3 SNMP 
8-6 IP Net/3 SNMP 
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SNMP[ D Ipstat] J 0 U 
ipDefaultTTL ip_defttl 000000 TTL(64[] ) 
ipForwarding ipforwarding 0200000000 
ipReasmTimeout IPFRAGTTL 0000000 600) 
ipInReceives ips_total O0000P000 
ipInHdrErrors ips badsum+ PIODOOODOO 


ips tooshort+ 
ips toosmall+ 
ips badhlen+ 
ips badlen+ 
ips, badoptions+ 


ips badvers 









































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































ipInAddrErrors ips cantforward NO DO 0 D POOD (Gp output UU) 
ipForwDatagrams ips_forward [1 D] H IP] Ú] 
ipReasmRegds ips_fragments 000000 
ipReasmFails ips_fragdropped+ 000000 
ips fragtimeout 
ipReasmOKs ips reassembled 0000000000 
ipInDiscards «utu» pagada go on 000000 
ipInUnknownProtos ips_noproto pg40000000000000 
ipInDelivers ips_delivered 020000000000 
ipOutReguests ips localout O0O000000000 
ipFragOKs ips, fragmented 2000000090 
iPFragFails ips cantfrag 0000000001000 
ipFragCreates ips_ofragments 0000000090 
ipOutDiscards ips_odropped OOO00000000P000 
ipOutRoutes ips noroute DU D D D D 0 DDD (pn D 0 
[] 8-6 IPO [| SNMP[] [] D D D 
8.3 PI! 
U U U D D D D D Internet 0000 000000000000 38-70 000000 
Internet ul 
IP| 
8-7[] UDP] IP] 00060 
U uui U UU U IP[] UU UU UU UU UU 
u IP UUUUULUU 8-7 U Lu L LU U U U 
OOOOOOOOOOOOOOOO IP (T U T U T T POOOOOO 
U U U 
IP U U UD U D 00 IG 0 0 D 0 0 0 0 0000 (000000100 8-8 
U U IPE D EL 0 0 
[] 8-80 [| ip ( 89500000 E] E] E] Net3[] 0000! IP] O [| 
47-67 |U #ifs 
0000000 IP 0000000000 Ne/30 00 i»000000000000 IP 
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— i 















































































































































—— 00 — 


P vm 


Ea 2 EE RE 


DD 0000 
T press Ge 
k— 00 — 002 ` 003 


pol TER] EET ses | peer 


87 DO0000000000000 
15 16 


i i ip len 
i U U U O! U U 0000000 
ip 14 ip off 
um Tu E 
ip_ ip_p ip_cksum 



















088 PO00000ie000 





Structure of an internet header, naked of options. 


* 
* 
43 * We declare ip len and ip off to be short, rather than u short 
* pragmatically since otherwise unsigned comparisons can result 
* against negative integers quite easily, and fail in subtle ways. 
46 */ 
47 struct ip ( 
48 #if BYTE_ORDER == LITTLE "SEND FAN 


49 u Char ip_hl:4, /* header length */ 
50 ip_v:4; /* version */ 

51 #endif 

52 #if BYTE_ORDER == BIG_ENDIAN 

53 u_char ip_v:4, /* version */ 

54 ip hl:4; /* header length */ 
55 #endif 


089 ip] l 





Ld IP 167 

























































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































56 u char ip tos; /* type of service */ 
57 short ip len; /* total length */ 
58 u short ip id; /* identification */ 
59 short ip off; /* fragment offset field */ 
60 #define IP DF 0x4000 /* dont fragment flag */ 
61 #define IP MF 0x2000 /* more fragments flag */ 
62 #define IP OFFMASK Oxlfff /* mask for fragmenting bits */ 
63 u char ip ttl; /* time to live */ 
64 u_char ip p; /* protocol */ 
65 u short ip sum; /* checksum */ 
66 struct in addr ip src, ip dst; /* source and dest address */ 
67 ); ; 
ip.h 
0182-2015 
IP IP 
IP ip_v 4 ip hl 4 
ip len ip p ip sum 
IP 20 ip_hl 5 5 IP 
ip hl 15 (2* 1) 40 (20+40=60)[] IP 
65535 (2! 1) ip len 16 bit 8-10 
(ip nix 4] O 
U un DO 
(20 Å) (004000) 
ip len [D 
655350 [] 
08-10 [00010000 
ip hl 4 IP| 4 
8.4 DODOL ipintr] |] 
3 4 5 
1) (Y 4.3[] ) 
2) SLIP IP (I 5.3[] ) 
3) looutput sa family 
(U 5.4[] ) 
ipintrq schednetisr 
IP schednetisr ipintr 
ipintr CPU splnet 
8.4.1 ipintr 
ipintr 4 (1) (2) 
(3) (4) ipintr 
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10 8-11 ipintr 
ip_input.c 
100 void P-P 
101 ipintr() 
102 1 
103 struct ip *ip; 
104 struct mbuf *m; 
105 struct ipq *fp; 
106 struct in_ifaddr *ia; 
107 int hlen, s; 
108 next: 
109 /* 
110 * Get next datagram off input queue and get IP header 
111 * in first mbuf. 
112 */ 
113 s = splimp(); 
114 IF. DEQUEUE (&ipintrq, m); 
115 splx(s); 
116 if (m == 0) 
117 return; 
332 goto next; 
333 bad: 
334 m freem(m); 
335 goto next; 
336 3 TS 
ip input.c 
D 8-11 ipintr [][] 
100-117 next ipintr|| ipintrq 
goto next 
ipintr splimp 
( slinput[]ether | input] 
332-336 bad mbuf next 
ipintr bad 
8.4.2 
8-12 ipintrq 
118 P ip input.c 
119 * If no IP addresses have been set yet but the interfaces 
120 * are receiving, can't do anything with incoming packets yet. 
121 */ 
122 if (in_ifaddr == NULL) 
123 goto bad; 
124 ipstat.ips_total++; 
125 if (m-»m len < sizeof (struct ip) Së 


O 8-12 ipintr [ [J 





Chinapubseon m 169 
















































































126 (m = m pullup(m, sizeof(struct ip))) == 0) ( 

127 ipstat.ips_toosmall++; 

128 goto next; 

129 } 

130 ip = mtod(m, struct ip *); 

131 if (ip->ip_v != IPVERSION) { 

132 ipstat.ips_badvers++; 

133 goto bad; 

134 } 

135 hlen = ip->ip_hl << 2; 

136 if (hlen < sizeof(struct ip)) { /* minimum header length */ 

137 ipstat.ips badhlen++; 

138 goto bad; 

139 ) 

140 if (hlen > m->m len) ( 

141 if ((m = m_pullup(m, hlen)) == 0) { 

142 ipstat.ips badhlen++; 

143 goto next; 

144 } 

145 ip = mtod(m, struct ip *); 

146 } 

147 if (ip->ip sum = in cksum(m, hlen)) { 

148 ipstat.ips badsum++; 

149 goto bad; 

150 ) 

151 /* 

152 * Convert fields to host representation. 

153 */ 

154 NTOHS (ip-»ip len); 

155 if (ip-»ip len « hlen) ( 

156 ipstat.ips_badlen++; 

157 goto bad; 

158 } 

159 NTOHS (ip->ip id); 

160 NTOHS (ip->ip off); 

161 /* 

162 * Check that the amount of data in the buffers 

163 * is as at least much as the IP header would have us expect. 

164 * Trim mbufs if longer than we expect. 

165 * Drop packet if shorter than we expect. 

166 */ 

167 if (m->m_pkthdr.len < ip->ip_len) ( c 

168 ipstat.ips_tooshort++; 

169 goto bad; 

170 } 

171 if (m->m_pkthdr.len > ip->ip len) { 

172 if (m->m len == m->m pkthdr.len) ( 

173 m->m len = ip->ip len; 

174 m->m pkthdr.len = ip->ip len; 

175 ) else 

176 m adj(m, ip->ip len - m->m_pkthär.len); 

177 ) ip input.c 
[18-12 (0) 

1. IP 
118-134 in_ifaddr|] ( 6.51 ) IP ipintr 














































































































































































































































































































IP ipintr 


















































170 
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TCP/IP 2 
6.3 
ipint IP ip v[] 4(IPVERSION)[] RFC 1122 
Net/2 ip v IP Net/2 IP 
4 IP IP 
ip_v 
IEN 119 [Forgie 1979] [| RFC 1190 [Topolcic 1990] TP sU 6 
6 IP (IPv6) OU] 15 
C 
2 mbuf 
IP mbu mbu 
IP 
( ) 
135-146 IP ( ) 
° mbuf IP (20 JJ m pullup 
(60 ) IP mbuf 
m pullu 
*ip hl 4 hlen 
. IP! hlen (20 ) 
. mbuf[] ( IP ) m_pullup 
Internet ( 
in_cksum IP IP ( 
) UDP[] TCP 
2. IP 
147-150 ipintr in_cksum ip_sum 
0 
8.7 ip_sum 
in_cksum ip_sum ( 
TTD] ip output 
8.7 in cksum 
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151-160 Internet NTOHS 
IP 16 bit (ip_len) 
(ip_id) (ip off) NTOHS 
Net/3 
4. 
161-177 (ip len) mbuf (m pkthdr.len) 
mbuf 
IP 
IP 
IP| IP 
IP 
8.4.3 
8-13 ipintr ip dooptions( 9] ) IP 
Net/3 
( ) 
ip_input.c 

178 /* pp 

179 * Process options and, if not destined for us, 

180 * ship it on. ip dooptions returns 1 when an 

181 * error was detected (causing an icmp message 

182 * to be sent and the original packet to be freed). 

183 */ 

184 ip_nhops = 0; /* for source routed packets */ 

185 if (hlen > sizeof (struct ip) && ip_dooptions (m) ) 

186 goto next; : 

187 /* 

188 * Check our list of addresses, to see if the packet is for us. 

189 */ 

190 for (ia = in ifaddr; ia; ia = ia->ia next) I 


191 #define satosin(sa) ((struct sockaddr_in *) (sa)) 


192 if (IA_SIN(ia)->sin_addr.s_addr == ip->ip_dst.s_addr) 

193 goto ours; 

194 /* Only examine broadcast addresses for the receiving interface */ 
195 if (ia->ia_ifp == m->m_pkthär.rcvif && 

196 (ia->ia_ifp->if_flags & IFF BROADCAST)) { 

197 u long t; 

198 if (satosin(&ia->ia broadaddr)-»sin addr.s addr == 

199 ip->ip_dst.s_addr) 

200 goto ours; 

201 if (ip->ip_dst.s_addr == ia->ia netbroadcast.s addr) 


O 8-13 [] ipintr 


172 





TCP/IP 2 
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202 goto ours; 
203 FX 
204 * Look for all-0's host part (old broadcast addr), 
205 * either for subnet or net. 
206 */ 
207 t = ntohl (ip->ip_dst.s_addr); 
208 if (t == ia->ia subnet) 
209 goto ours; 
210 if (t == ia->ia net) 
211 goto ours; 
212 ) 
213 ) 
258 if (ip->ip dst.s addr == (u long) INADDR BROADCAST) 
259 goto ours; 
260 if (ip->ip_dst.s_addr == INADDR ANY) 
261 goto ours; 
262 /* 
263 * Not for us; forward if possible and desirable. 
264 */ 
265 if (ipforwarding == 0) ( 
266 ipstat.ips cantforward++; 
267 m freem(m); 
268 ) else 
269 ip forward(m, 0); 
270 goto next; 
271 ours: 
TITT o R p input.c 
[13-13 (01) 
1. 
178-186 ip nhops([] 9.6[] ) 
ip dooptions ip ooption 
ipintr ip dooptions 
ipintr 
ipintr IP ip_dst IP 
ipintr 
2. 
187-261 ipintr in ifaddr([] 6-5) Internet| 
in ifaddr 


















































































































































































































































































































































(O 8-14 ) 
(O 8-14 40) 
(O 12-39) 
( 8-14 




























































































































































































8-14 




































































sun 













































































12 














































































































































































































































































































































































































































































































































































































































































































































































































140.252.1.29 








































































































(U 8.13) 










































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































.33 127.0.0.1 
ia broadaddr 198-200 
.252.13.224 
ia netbroadcast 201-202 
.255.255 
ia subnet 207—209 
2.13.32 
ia net 210-211 
140.252.0.0 
INADDR BROADCAST 258-259 
255.255.255.255 
INADDR_ANY 260-261 
0.0.0.0 
08-14 BOBO DO DDD 00 00000000 
ia subnet[| ia net[| INADDR_ANY 
4.2BSD TCP/IP 4.2BSD 
3. 
262-271 ip_dst 
ipforwarding ip_forward 
Net/3 in_ifaddr 
RFC 1122 (strong end system) 
(weak end system) 
Net/3 
8.4.4 
ipintr ([] 8-15) 
10 ip 
ip 
325-332 ip pl] ip_protox (U 7-22) inetsw 
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ipintr protosw pr_input 
pr_input ipintr ipintrq 
ipintr IP 
TCP/IP[] SVR4 





















































ip input.c 





325 /* 

326 * If control reaches here, ip points to a complete datagram. 

327 * Otherwise, the reassembly code jumps back to next (Figure 8.11) 
328 * Switch out to protocol's input routine. 

329 x 

330 ipstat.ips_delivered++; 

331 (*inetsw[ip_protox[ip->ip_p]].pr_input) (m, hlen); 

332 goto next; 





85 OOO ip. forward[] |] 


[] 8-15 [| ipintr 


ip, input.c 





































































































ipforwarding 








(6.10 ) 










































































ip forward 












































(9.6[] ) ipintr 
ip dooptions ip forward 
ip forward 8-16 route 



















































































2 srcrt 
































































































































46 struct route ( 


47 struct 
48 struct 


rtentry *ro_rt; 
sockaddr ro_dst; 



































/* pointer to struct with information */ 


/* destination of this route */ 


[] 8-16 route [] [] 






































route.h 





























































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































46-49 route ro rt rtentry ro dst 
Sockaddr ro rt 
18 rtentry 
ip forward IP 
ICMP ip output 8-17 
1. 
867-871 ip_froward 1 mbuf mbuf 
2 srert (U 9.61] ) 
879-884 if 
M_BCAST 
ether input([] 4-13) M BCAST 
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RFC 1122 IP 
in canforward 0 ipintr ip 
forward 
° op E 
in_canforward 0 
s D 
D ip_mforward ip_forward 
in_canforward DU ( ) 
RFC 791 (TTL) 1 TTL 
TTL IP 
1 ip_ttl 1 
Tr a al 


868 ip_forwardím, srcrt) 
869 struct mbuf *m; 


870 int srcrt; 

871 L 

872 struct ip *ip = mtod(m, struct ip *); 

873 struct sockaddr in *sin; 

874 struct rtentry *rt; 

875 int error, type = 0, code; 

876 struct mbuf *mcopy; 

877 n long dest; 

878 struct ifnet *destifp; 

879 dest = 0; 

880 if (m->m flags & M BCAST || in canforward(ip->ip dst) == 0) { 
881 ipstat.ips cantforward++; 

882 m freem(m); 

883 return; 

884 } 

885 HTONS (ip->ip. id); 

886 E if (ip->ip ttl <= IPTTLDEC) { 

887 icmp_error (m, ICMP_TIMXCEED, ICMP_TIMXCEED_INTRANS, dest, 0); 
888 return; 

889 } 

890 ip->ip ttl -= IPTTLDEC; 

891 sin = (struct sockaddr_in *) &ipforward_rt.ro_dst; 
892 if ((rt = ipforward_rt.ro_rt) == E 

893 ip->ip dst.s addr != sin->sin addr.s addr) { 
894 if (ipforward rt.ro rt) ( 

895 RTFREE(ipforward rt.ro rt); 

896 ipforward rt.ro rt = 0; 

897 } 

898 sin->sin_family = AF_INET; 

899 sin->sin_len = sizeof (*sin); 

900 sin->sin_addr = ip->ip_dst; 

901 rtalloc (&ipforward_rt); 


0 8-17 ip forward [000000 
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902 if (ipforward rt.ro rt == 0) { 
903 icmp_error (m, ICMP UNREACH, ICMP UNREACH HOST, dest, 0); 
904 return; 
905 H 
906 rt = ipforward_rt.ro_rt; 
907 } 
908 FE 
909 * Save at most 64 bytes of the packet in case 
910 * we need to generate an ICMP message to the src. 
911 */ 
912 mcopy = m_copy(m, 0, imin((int) ip->ip_len, 64)); 
913 ip_ifmatrix[rt->rt_ifp->if_index + 
914 if index * m->m_pkthär.revif->if_index] ++; ur 
ip input.c 
[15-17 (1) 
Internet 
(diameter) [Olivier 1994] 37 
2. TTL 
885-890 
ip. forward IP ICMP 
Net/3 ipintr ip len 
386 
ICMP IP 386 
SVR4( Net/1[] )[] AIX3.2(4.3BSD Reno[] ) ICMP 
ip tti 1(IPTTLDEC) ICMP 
ip forward||ip ttl IPTTLDEC 
TTL[] Of] IP Net/3 ICMP 
p ttl 
3. 
891-907 IP route ipforward rt 
([Jain[] Routhier 1986][] [Mogul 
1991]) (one-behind) 
(ipforward rt) ipforward rt 
ro dst rtalloc 
ICMP 
908-914 ip_output m_copy 64 
ip_forward ICMP m_copy ip_forward 
ip_ifmatrix 
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ICMP IP 




















































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































08-18 QOORIGO0000 HS) 0 D D 0 R200 HD 
8-18 
HS[] R1 HS HD R2 
RI[] R1 R2 HS 
HS HD R2 
RFC 1122 | | ICMP 
(11.8[] ) Net/3 ip forward 
Net/3 RFC 1122 
8-19 ip forward 
1. 
915-929 (rt ifp 
rcvif) ICMP 
(RTF DYNAMIC|RTF MODIFIED) 
(0.0.0.0) | 












































































































































































































































0.0.0.0 





























































































































































































































0.0.0.0 
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TCP/IP 2 
18 
ipsendredirects (1 8.90) 
ipsendredirects 1 ip_forward srert 
ip_input.c 
915 £* i KORP 
916 * If forwarding packet is using same interface that it came in on, 
917 * perhaps should send a redirect to sender to shortcut a hop. 
918 * Only send redirect if source is sending directly to us, 
919 * and if packet was not source routed (or has any options). 
920 * Also, don't send redirect if forwarding using a default route 
921 * or a route modified by a redirect. 
922 */ 
923 define satosin(sa) ((struct sockaddr in +) (sa)) 
924 if (rt->rt_ifp == m->m pkthdr.revif && 
925 (rt->rt flags & (RTF DYNAMIC | RTF MODIFIED)) == 0 && 
926 satosin(rt_key(rt))->sin_addr.s_addr != 0 && 
927 ipsendredirects && !srcrt) { 


928 #define 





RTA(rt) ((struct in_ifaddr *) (rt->rt_ifa)) 
u_long src = ntohl (ip->ip_src.s_addr); 

















































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































930 if (RTA(rt) && i 
931 (src & RTA(rt)->ia subnetmask) == RTA(rt)->ia subnet) { 
932 if (rt->rt flags & RTF GATEWAY) 
933 dest = satosin(rt->rt gateway)->sin addr.s addr; 
934 else 
935 dest = ip->ip dst.s addr; 
936 /* Router requirements says to only send host redirects */ 
937 type = ICMP_REDIRECT; 
938 code = ICMP_REDIRECT_HOST; 
939 } 
940 } i. 
tp. input.c 
O 8-19 ip forward ([] ) 
2. 
930-931 
IP 
ICMP 
ipforwarding 
( JU Net/3 
3. 
932-940 ICMP 
RFC 792 4 (1) (2) (3)TOS (4)TOS 
RFC 1009 
RFC 1122 
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Net/3 TOS 8-20 
ipintr ICMP 
: - ip input.c 
941 error - ip output(m, (struct mbuf *) 0, &ipforward rt, 
942 IP FORWARDING | IP ALLOWBROADCAST, 0); 
943 if (error) 
944 ipstat.ips_cantforward++; 
945 else { 
946 ipstat.ips_forward++; 
947 if (type) 
948 ipstat.ips_redirectsent++; 
949 else { 
950 if (mcopy) 
951 m freem(mcopy); 
952 return; 
953 } 
954 } 
955 if (mcopy == NULL) 
956 return; 
957 destifp = NULL; 
958 switch (error) { 
959 case 0: /* forwarded, but need redirect */ 
960 /* type, code set above */ 
961 break; 
962 case ENETUNREACH: /* shouldn’t happen, checked above */ 
963 case EHOSTUNREACH: 
964 case ENETDOWN: 
965 case EHOSTDOWN: 
966 default: 
967 type = ICMP_UNREACH; 
968 code = ICMP_UNREACH_HOST; 
969 break; 
970 case EMSGSIZE: 
971 type = ICMP_UNREACH; 
972 code = ICMP_UNREACH_NEEDFRAG; 
973 if (ipforward_rt.ro_rt) 
974 destifp = ipforward_rt.ro_rt->rt_ifp; 
975 ipstat.ips cantfrag++; 
976 break; 
977 case ENOBUFS: 
978 type = ICMP SOURCEQUENCH; 
979 code = 0; 
980 break; 
981 ) 
982 icmp_error (mcopy, type, code, dest, destifp); 
983 } "m 
ip input.c 


O 8-20 ip forward(]) 
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TCP/IP 








[ 2 
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40000 
941-954 ip forward 0000000 ICMP] VUUUU Ip_ 
output] OO [| ipforward_rt | 0 IP ALLOWBROADCAST 0 
n OO ip_output] | 0000 
U 64 ip_forward|] 
5. [| O ICMPO [] 
955-983 ip_forward ip. output| | ICMPI] | D | o 
(| JOD JOD | 3 GE] 0000 ip_forward 
UULU typell codell [] | | ip output switch{] |] 
ip output[] ICMP O icmp error I] Ü Ú] Ú 
ip_outputICMP E Ooo [] 
lip output 0 00 switch] O00 | | U U U ICMP 
| | | U | 8-21 | 11 | | ICMP 
[| ip output[] [| ENOBUFS Net/3 | U ICMP O [] Router 
Requirements([] [] O )RFC [Almquist[] Kastenholz 1994 ]| Hl OO 
| | | i 
O O ip output O00 DU D D teme] Ú [] [] 
EMSGSIZE ICMP UNREACH NEEDFRAG U D D D D D DDD DDD DD DD D 
DU DD DDD (0 100) 
ENOBUFS ICMP_SOURCEQUENCH U D DDD DDD DDD DDD DD D 
O00000000000 
EHOSTUNREACH OOO000000 
ENETDOWN I000000000000 
EHOSTDOWN ICMP UNREACH HOST D D DD DDD DDD DDD D 
default O0O000000000 
ICMP UNREACH HOST J O00 




















8-21 


86 00000 iP_output{] [| 






































O O ip output I 





00 













































































































































































































































































































































































































































































IP| OD ip forward[] E (7 S- D[] [ inetsw[0] 
Dr output IP[] | 0 | 0 0 | | Ü Internet[] 
(ICMP[] IGMP[] UDP[] TCP) ip output [| inetsw[] U [| [| [] Internet[] 

protosw Od uut E 
IP 20 i | pr output[] [| IP] 
U ip output: 



















































































































































































































































































































































































































































































































































































































































































































































































8.6.1 OTU 
8-22 ip output 0 | |H ( 
ip_forward UDD 
44-59 ip_output mo opt IP ro 
flags 8-23[] imo 12] 
IP_FORWARDING|| ip forward||ip mforward( 
ip_output IP 
ae one ip_output.c 
45 ip output (m0, opt, ro, flags, imo) 
46 struct mbuf *m0; 
47 struct mbuf *opt; 
48 struct route *ro; 
49 int flags; 
50 struct ip_moptions *imo; 
51 { 
52 struct ip *ip, *mhip; 
53 struct ifnet *ifp; 
54 struct mbuf *m = m0; 
55 int hlen = sizeof(struct ip); 
56 int len, off, error = 0; 
57 struct route iproute; 
58 struct sockaddr_in *dst; 
59 struct in_ifaddr *ia; 
60 if (opt) { 
61 m = ip_insertoptions(m, opt, &len); 
62 hlen = len; 
63 } 
64 ip = mtod(m, struct ip *); 
65 /* 
66 * Fill in IP header. 
67 */ 
68 if ((flags & (IP FORWARDING | IP RAWOUTPUT)) == 0) { 
69 ip->ip_v = IPVERSION; 
70 ip->ip_off &= IP_DF; 
71 ip->ip_id = htons (ip_id++); 
72 ip->ip_hl = hlen >> 2; 
73 ipstat.ips_localout++; 
74 } else { 
75 hlen = ip->ip_hl << 2; 
76 } ` 
ip. output.c 


H 8-22 I [| ip output 





o d 


IP_FORWARDING 
IP_ROUTETOIF 
IP_ALLOWBROADCAST 
IP_RAWOUTPUT 








U D 


O000000000 
0000000000000 
00000000 
000000 1200000 











H $23 


ip output [] flag [] 


1 82 TCP/IP 2 
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send| | sendto|| sendmsg|| MSG_DONTROUTE IP_ROUTETOIF 
(O 16.4) SO_DONTROUTE IP_ROUTETOIF 
(U 8.80 ) ip_ output 
IP_ALLOWBROADCAST SO_BROADCAST (U 8.80 ) UDP 
IP IP ALLOWBROADCAST[] TCP IP 
ALLOWBROADCAST TCP ip output 
1. IP 
60-73 IP ip insertoptions([]O9.8[]) 
8.8 IP OPTIONS IP 
(TCP[] UDP) ip output 
(IP. FORWARDING) (IP RAWOUTPUT) IP ip 
output ( UDP[] TCP ) IP 
ip outputl| ip v A(IPVERSION) DF ip off 
( 10[] ) ip->ip id 
ip id[]l[] ip id (U 7.80] DØ ip hil 32 bit 
IP —— TTL TOS — 
([] 8-25) 
2 
74-76 ( IP ) ( ) 
hlen | 
8.6.2 OQ 
IP ip output[|l] 8-24 
33 Få ip. output.c 
78 * Route packet. 
79 */ 
80 if (ro == 0) L 
81 ro = &iproute; 
82 bzero((caddr t) ro, sizeof(*ro)); 
83 H 
84 dst = (struct sockaddr in *) &ro->ro_dst; 
85 ZS 
86 * If there is a cached route, 
87 * check that it is to the same destination 
88 * and is still up. If not, free it and try again. 
89 */ 
90 if (ro->ro_rt && ((ro->ro rt->rt flags & RTF UP) == 0 || 
91 dst->sin_addr.s_addr != ip->ip_dst.s_addr)) { 
92 RTFREE (ro->ro rt); 
93 ro->ro rt = (struct rtentry +) 0; 
94 


D 8-24 ip output (DO) 
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95 if (ro->ro_rt == 0) { 

96 dst->sin family = AF INET; 

97 dst-»sin len = sizeof(*dst); 

98 dst->sin_addr = ip-»ip dst; 

99 } 

100 /* 
101 * if routing to interface only, 
102 * short circuit routing lookup. 
103 */ 

104 #define ifatoia(ifa) ((struct in_ifaddr *) (ifa)) 
105 #define sintosa(sin) ((struct sockaddr zi (sin)) 
106 if (flags € IP_ROUTETOIF) ( 

107 if ((ia = ifatoia(ifa ifwithdstaddr(sintosa(dst)))) == 0 ££ 
108 (ia = ifatoia(ifa ifwithnet(sintosa(dst)))) == 0) { 
109 ipstat.ips noroute++; 

110 error = ENETUNREACH; 

111 goto bad; 

112 } 

113 ifp = ia->ia_ifp; 

114 ip-»ip ttl = 1; 

115 ) else ( 

116 if (ro-»ro rt -- 0) 

117 rtalloc (ro); 

118 if (ro-»ro rt == 0) ( 

119 ipstat.ips_noroute++; 
120 error = EHOSTUNREACH; 

121 goto bad; 

122 } 

123 ia = ifatoia(ro->ro_rt->rt_ifa); 

124 ifp = ro->ro_rt->rt_ifp; 

125 ro-»ro rt->rtuse++; 

126 if (ro-»ro.rt-»rt flags & RTF GATEWAY) 

127 dst = (struct sockaddr in *) ro->ro rt->rt gateway; 
128 3 











































































































































































































































































































































































































































































































































































































































































































ip_output.c 
08-24 (0) 
1. 
77-99 ip output ro 24 
UDP[] TCP ip output[] ro 
route iproute 
dst 
2. 
100-114 IP ROUTETOIFO ([ 8.80) 
























































































































































ip output 
ifa ifwithdstaddr in ifwithnet 
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TCP/IP 2 
3. 

115-122 (IP ROUTETOIF ) 

rtalloc dst rtalloc ip output 

EHOSTUNREACH ip_forward ip_output EHOSTUNREACH 
ICMP ip_output (U 8-21) 
123-128 ia (ifaddr ) ifp ifnet 

dst 
IP dst 
8.6.3 
ip_output 8-25 IP 
MTU 
10 
ip_output.c 

212 Zë 

213 * If source address not specified yet, use address 

214 * of outgoing interface. 

215 */ 

216 if (ip->ip_src.s_addr == INADDR ANY) 

217 ip->ip src = IA SIN(ia)->sin addr; 

218 £ 

219 * Look for broadcast address and 

220 * verify user is allowed to send 

221 * such a packet. 

222 EJ 

223 if (in_broadcast (dst->sin_addr, ifp)) ( 

224 if ((ifp->if_flags & IFF_BROADCAST) == 0) ( /* interface check */ 

225 error = EADDRNOTAVAIL; 

226 goto bad; 

227 } 

228 if ((flags & IP_ALLOWBROADCAST) == 0) { /* application check */ 

229 error = EACCES; 

230 goto bad; 

231 } 

232 /* don't allow broadcast messages to be fragmented */ 

233 if ((u_short) ip->ip_len > ifp->if_mtu) { 

234 error = EMSGSIZE; 

235 goto bad; 

236 } 

237 m->m_flags |= M BCAST; 

238 } else 

239 m->m_flags &= "M BCAST; 

240 sendit: 

241 /* 

242 * If small enough for interface, can just send directly. 

243 Ef 

244 if ((u short) ip->ip_len <= ifp->if mtu) ( 


[] 8225 ip output([]) 
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245 ip-»ip len = htons((u short) ip-»ip len); 


246 ip-»ip off - htons((u short) ip-»ip off); 

247 ip->ip sum = 0; 

248 ip->ip sum = in cksum(m, hlen); 

249 error = (*ifp->if output) (ifp, m, 

250 (struct sockaddr *) dst, ro-»ro rt); 
251 goto done; 

252 } 











































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































339 done: 
340 if (ro == &iproute && (flags & IP ROUTETOIF) == 0 && ro->ro rt) 
341 RTFREE(ro-»ro rt); 
342 return (error); 
343 bad: 
344 m freem(m0); 
345 goto done; 
346 3 ; 
ip output.c 
D 8-25 (0) 
1. 
212-239 ip_src ip_output IP ia 
IP 
IP (IFF_BROADCAST 3-7) 
(IP_ALLOWBROADCAST 8-23) 
IP 
MTU 
EADDRNOTAVAIL[| EACCES|| EMSGSIZE 
M_BCAST 
21.20 arpresolvel] IP 
ip output||M BCAST 
M BCAST 
11 ICMP TCP RST 
(0 26.9] ) 
2. 
240-252 ip len ip off IP| 
in cksum([] 8.7[] ) if output 
3. 
253-338 10 
4. 
339-346 ro ip 




























































































































































































1 86 TCP/IP 
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2 
output route (iproute) RTFREE iproute 
1[] Bad 

0 

8.7 Internet] [| [| O in_cksum|] [] 
([Kay[] Pasquale 1993]) 

mbuf Net/3 

Net/3 in cksum ([] 8-26) 



































































































































Sys/netinet/in cksum.c 
net3/sparc/sparc/in cksum.c 


net3/luna68k/luna68k/in cksum.c 


sys/vax/vax/in_cksum.c 
sys/tahoe/tahoe/in_cksum.c 
sys/hp300/hp300/in_cksum.c 
sys/i386/i386/in cksum.c 


08-26 [] Net/3 [] [] [] in cksum [| [| 




























































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































C RFC 1071 [Braden[] Borman[] Partridge 
1988] [] RFC 1141 [Mallory[] Kullberg 1990] Internet RFC 
1141[] RFC 1624 [Rijsinghani 1994] RFC 1071 
1) 16 bit 
2) 16 bit 
3) 1( 
-0 ) 
0 1 
[Mano 1982] 
IP 
0 ( ) 
16 bit a 0 
a IP a 
(a+- a) 
(a+- a) - O( 1) OJ 0) 
0 8-12 
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C ( Net/3 ) 
































































































































1 unsigned short 
2 cksum(struct ip *ip, int len) 











































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































3 ( 
4 long sum = 0; /* assume 32 bit long, 16 bit short */ 
5 while (len > 1) { 
6 sum += *((unsigned short *) ip)++; 
7 if (sum & 0x80000000) /* if high-order bit set, fold */ 
8 sum = (sum & OxFFFF) + (sum >> 16); 
9 len -= 2; 
10 } 
11 if (len) /* take care of left over byte */ 
12 sum += (unsigned short) * (unsigned char *) ip; 
13 while (sum >> 16) 
14 sum = (sum & OxFFFF) + (sum >> 16); 
15 return "sum; 
16 } 
0827 HDD DDD D D D 
1-16 sum[] 16 bit 
16 bit RFC 1071 (deferred carries) 
Net/3 C mbuf 
42-140 mbu 
mbuf] 32bit 16 bit 
mbuf mbu 
16 bit 
in_cksum in 
cksum 
93-115 while 16 4 1 
in_cksum.c 


42 #define ADDCARRY (x) (x > 65535 ? x -= 65535 : x) 
43 #define REDUCE (1 util.l = sum; sum = 1 util.s[0] + l_util.s[1]; ADDCARRY (sum) ;} 


44 int 
45 in_cksum(m, len) 
46 struct mbuf *m; 


47 int len; 

48 ( 

49 u_short *w; 

50 int sum = 0; 





0828 PIIODOOOOOOOOOOD en 












































188 remo n: China-bubıcom 
TJ 


51 int mlen = 0; 

52 int byte swapped = 0; 

53 ‚union { 

54 char c[2]; 

55 u short 8; 

56 } s_util; 

57 union { 

58 u_short s[2]; 

59 long 1; 

60 } Lutil; 

61 for (; m && len; m = m->m_next) { 

62 if (m->m_len == 0) 

63 continue; 

64 w = mtod(m, u short *); 

65 if (mlen == -1) ( 

66 /* 

67 * The first byte of this mbuf is the continuation of a 
68 * word spanning between this mbuf and the last mbuf. 
69 * 

70 * s, util.c[0] is already saved when scanning previous mbuf. 
71 */ 

72 S util.c[1] = *(char *) w; 

73 sum += S util.s; 

74 w = fu short *) ((char *) w + 1); 

75 mlen = m->m len - 1; 

76 len--; 

77 ) else 

78 mlen - m->m len; 

79 if (len « mlen) 

80 mlen - len; 

81 len -- mlen; 

82 /* 

83 * Force to even boundary. 

84 */ 

85 if ((1 & (int) w) && (mlen > 0)) { 

86 REDUCE; 

87 sum <<= 8; 

88 s_util.c[0] = *(u_char *) w; 

89 w = (u short *) ((char *) w + 1); 

90 mlen--; 

91 byte_swapped = 1; 

92 } 

93 /* 

94 * Unroll the loop to make overhead from 

95 * branches &c small. 

96 */ 

97 while ((mlen -= 32) >= 0) ( 

98 sum += w[0]; sum += w[1]; sum += w[2]; sum += w[3]; 
99 sum += w[4]; sum += w[5]; sum += w[6]; sum += w[7]; 
100 sum += w[8]; sum += w[9]; sum += w[10]; sum += w[11]; 
101 sum += w[12]; sum += w[13]; sum += w[14]; sum += w[15]; 
102 w += 16; 

103 ) 

104 mlen += 32; 

105 while ((mlen -= 8) >= 0) { 

106 sum += w[0]; sum += w[1]; sum += w[2]; sum += w[3]; 
107 w += 4; 


08-28 (U) 
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108 } 
109 mlen += 8; 
110 if (mlen == 0 && byte swapped == 0) 
111 continue; 
112 REDUCE; 
113 while ((mlen -= 2) >= 0) ( 
114 sum += *wt+; 
115 } 
116 if (byte_swapped) { 
117 REDUCE; 
118 sum <<= 8; 
119 byte_swapped = 0; 
120 if (mlen == -1) { 
121 s util.c[1] = *(char +) w; 
122 sum += s util.s; 
123 mlen = 0; 
124 ) else 
125 mlen = -1; 
126 } else if (mlen == -1) 
127 S util.c[0] = *(char +) w; 
128 } 
129 if (len) 
130 printf("cksum: out of data\n"); 
131 if (mlen == -1) { 
132 /* The last mbuf has odd # of bytes. Follow the standard (the odd 
133 byte may be shifted left by 8 bits or not as determined by 
134 endian-ness of the machine) */ 
135 s_util.c[1] = 0; 
136 sum += S util.s; 
137 } 
138 REDUCE; 
139 return (”sum & Oxffff); 
er) in_cksum.c 
U 8-28 (U) 
RFC 1071 Net/3 
IP TCP[] UDP 
23.12 [Partridge[] Pink 
1993] IP in cksum 
6-8 ( 200 0 IPO 0) 
RFC 
1071 RFC 1141[] 1624 
TTL 



















































































































































































































































































































































































UDP[] TCP 

















































































































































































































23[] 25 UDP[] TCP IP 
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int setsockopt (int s, int level, int optname, void *optval, int optlen) ; 


int getsockopt (int s, int level, int optname, const void *optval, int optlen) ; 








TCP/IP 02 
LU U 0 0 D D D 0 D U D 0 U D U D 32 bit | LU LU U U U U U 1 ./sys/vax/ 
vax/in cksum.c[| [| [| VAX[]] [| [| in_cksum|] 
8.8 setsockopt[] getsockopt | [] [] [] 
Net/3[] [] setsockopt[] getsockopt[] [] L L L) U U U 1) 1) LU LU L L 
i OM i OM 
| 































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































32.8] | 





O 8-31 






































[GOOD 
| 0 sock RAW | 

















IPPROTO IPY [| [| ip ctloutput 




















[ 



































IPPROTO_IPJ D D 


0 OO sysct1[] ga 
L | 12 (UI 
setsockopt[] getsockopt 0 0 Net/3[] UU s 
o level | |] 8-29 | | | level | D Í 
17 setsockopt[] getsockopt[] 0 0 
| IP H B WO D H 
U D [] level O O O O 
Ooo [] SOL SOCKET sosetopt[] sogetopt O 17-50 0 17-11 
IP DP IPPROTO_IP ip_ctloutput O 8-31 
TCP IPPROTO_TCP tcp_ctloutput 30.60 
IPPROTO IP ip ctloutput O 8-31 
OM IP rip ctloutput[] 
ICMP IPPROTO IP ip ctloutput 32.80 
IGMP 
[] 8-29 sosetopt [| sogetopt [] [| 
OU OU U U 8-300 [| IPPROTO_IP] 
1 optval DO! 2 030 
00 U Optvall] [| O O O [] 
IP OPTIONS void* in pcbopts 0000000000010 0 
IP_TOS int ip_ctloutput I H U H H H DO DO DOG PTOS 
IP_TTL int ip ctloutput 000000000000 PTTL 
TP RECVDSTADDR | int ip ctloutput 00001000 OO UDP tr Ú 
IP_RECVOPTS int ip_ctloutput 020000000120 0000000090 
00 (00v2P0000O0N0 >) 
IP_RECVRETOPTS | int ip_ctloutput OOO000000000000000 
(U D voro D 0 0 D D ) 
08-30 00000 sock Raw [| SOCK_DGRAM [] SOCK_STREAMR [] O [| IPPROTO IP [] 











TOGO 
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ip output.c 
431 int p_outp 
432 ip_ctloutput(op, so, level, optname, mp) 
433 int op; 
434 struct socket *so; 
435 int level, optname; 
436 struct mbuf **mp; 
437 { 
438 struct inpcb *inp = sotoinpcb(so); 
439 struct mbuf *m = *mp; 
440 int optval; 
441 int error = 0; 
442 if (level != IPPROTO_IP) { 
443 error = EINVAL; 
444 if (op == PRCO_SETOPT && *mp) 
445 (void) m free(*mp); 
446 ) else 
447 switch (op) ( 
448 case PRCO SETOPT: 
449 switch (optname) ( 
493 freeit: 
494 default: 
495 error - EINVAL; 
496 break; 
497 } 
498 if (m) 
499 (void) m_free(m); 
500 break; 
501 case PRCO_GETOPT: 
502 switch (optname) { 
TE 
546 default: 
547 error - ENOPROTOOPT; 
548 break; 
549 } 
550 break; 
551 } 
552 return (error); 
553 } , 
tp. output.c 
[] 8-31 ip ctloutput 00000 
431-447 ip ctloutput op PRCO_SETOPT PRCO_GETOPT 
so level IPPROTO IP|! Optname 
mp mbuf[] m *mp 
mbu 
448-500 setsockopt ( switch 
























































































































































PRCO SETOPT JO ip ctloutput EINVAL 
































192 TCP/IP 












































China-pub.tom 


















































































































































































































































































































































































































































































































































































































































































































































































































































2 
501-553 getsockopt ip_ctloutput ENOPROTOOPT 
mbu 
8.8.4 PRCO_SETOPT|] |] 
PRCO_SETOPT 8-32 
ip_output.c 

450 case IP_OPTIONS: 

451 return (ip_pcbopts (&inp->inp_options, m)); 

452 case IP_TOS: 

453 case IP_TTL: 

454 case IP_RECVOPTS: 

455 case IP_RECVRETOPTS: 

456 case IP_RECVDSTADDR: 

457 if (m->m len != sizeof (int)) 

458 error = EINVAL; 

459 else { 

460 optval = *mtod(m, int *); 

461 switch (optname) { 

462 case IP_TOS: f 

463 inp->inp_ip.ip_tos = optval; 

464 break; 

465 case IP TTL: 

466 inp->inp ip.ip ttl = optval; 

467 break; 

468 #define OPTSET (bit) \ 

469 if (optval) \ 

470 inp->inp_flags |= bit; \ 

471 else \ 

472 inp->inp flags £= “bit; 

473 case IP_RECVOPTS: 

474 OPTSET (INP_RECVOPTS); 

475 break; 

476 case IP_RECVRETOPTS: 

477 OPTSET (INP RECVRETOPTS) ; 

478 break; 

479 case IP_RECVDSTADDR: 

480 OPTSET (INP RECVDSTADDR) ; 

481 break; 

482 } 

483 } 

484 break; . 

tp output.c 
[] 8-32 ip ctloutput 00000 PRCO SETOPT 
450-451 IP OPTIONS ip. pcbopts ([] 9-32) 
452—484 IP TOS IP. TTE IP RECVOPTS IP RECVERTOPTS IP 
RECVDSTADDR m | mbuf | optval 
ip tos ip ttl 
INP RECVOPTS|| INP RECVERTOPTS|| INP RECVDSTADDR optval 
(O 0) OPTSET ( ) 
| 8-30 IP_RECVOPTS|| IP_RECVERTOPTS 23 
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UDP 





































































































8.8.2 PRCO_GETOPT 











































































































































































































































































































































































































































































































8-33 PRCO GETOPT IP 
ip_output.c 
503 case IP_OPTIONS: p_outp 
504 *mp = m = m get(M WAIT, MT SOOPTS); 
505 if (inp->inp options) { 
506 m-»m len = inp->inp options-»m len; 
507 bcopy (mtod(inp-»inp options, caddr t), 
508 mtod(m, caddr t), (unsigned) m-»m len); 
509 ) else 
510 m->m len = 0; 
511 break; 
512 case IP TOS: 
513 case IP TTL: 
514 case IP RECVOPTS: 
515 case IP RECVRETOPTS: 
516 case IP_RECVDSTADDR: 
517 *mp = m = m_get (M_ WAIT, MT_SOOPTS); 
518 m->m_len = sizeof (int); 
519 switch (optname) { 
520 case IP_TOS: 
521 optval = inp->inp_ip.ip_tos; 
522 break; 
523 case IP_TTL: 
524 optval = inp->inp_ip.ip_ttl; 
525 break; 
526 #define OPTBIT(bit) (inp->inp flags & bit ? 1: 0) 
527 case IP RECVOPTS: 
528 optval = OPTBIT(INP RECVOPTS); 
529 break; 
530 case IP RECVRETOPTS: 
531 optval = OPTBIT(INP RECVRETOPTS); 
532 break; 
533 case IP_RECVDSTADDR: 
534 optval = OPTBIT(INP RECVDSTADDR); 
535 break; 
536 } 
537 *mtod(m, int *) = optval; 
538 break; . 
ip output.c 
[] 8-33 ip ctloutput [][][] Preo GETOPT [00 
503-538 IP OPTIONS[| ip ctloutput 
ip ctloutput ip tos[| ip ttl 
m mbuf| inp flags bit ( 
) OPTBIT 1] 0) 




































































8.9 ip sysctl[|[l 






















































































































































































7-27 sysctl 0 ip_sysctl 
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TCP/IP 2 
8-34 ip_sysctl 
sysct1[] U Net/3[] 0 O O 
IPCTL_FORWARDING ipforwarding 0000001000 
IPCTL_SENDREDIRECTS ipsendredirects 00000 CMP 000 
IPCTL_DEFTTL ip_defttl IPO 0000 TTL 
[] 8-34 sysctl O [| 
8-35 ip_sysctl 
984 int ip input.c 


985 ip sysctl(name, namelen, oldp, oldlenp, newp, newlen) 


986 int 


*name; 


987 u_int namelen; 
988 void *oldp; 
989 size_t *oldlenp; 






































































































































































































































































































































































































































































































































































































































990 void *newp; 
991 size t newlen; 
992 1 
993 /* All sysctl names at this level are terminal. */ 
994 if (namelen != 1) 
995 return (ENOTDIR); 
996 switch (name[0]) ( 
997 case IPCTL FORWARDING: 
998 return (sysctl int(oldp, oldlenp, newp, newlen, &ipforwarding)); 
999 case IPCTL SENDREDIRECTS: 
1000 return (sysctl int(oldp, oldlenp, newp, newlen, 
1001 &ipsendredirects)); 
1002 case IPCTL_DEFTTL: 
1003 return (sysctl int(oldp, oldlenp, newp, newlen, &ip_defttl)); 
1004 default: 
1005 return (EOPNOTSUPP); 
1006 } 
1007 /* NOTREACHED */ 
1008 } PNE 
ip input.c 
[] 8-35 ip sysctl UI 
ip sysctl sysctl name 
ENOTDIR 
Switch systl_int ipforwarding 
ipsendredirects[| ip_defttl EOPNOTSUPP 
8.10 1 
IP Internet | | IP 
20 40 IP 
9 10 






































































































































































































































ipintr 
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ip forward lO O TTL| 0 
ip forward 
Internet Internet Net/3[] in cksum IP 
( ) IE D IP 
U U 
8.1 IP! IP 
8.2 ip_forward|] ip output IP 
8.3 | i L L [] M_BCAST IP 
(in canforward) | IP | 
84 IP 
8.5 
8.6 
(ipforwarding 1) 
8.7 8-17 ip ttl[]( ) 1 
8.8 
8.9 8-14 SLIP 8-14 
810 ip_forward icmp_error U id U 
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91 DD 
8 IP (ipintr)[]ll ll u d 000) [ [] 
uu uu 0 uu 0 
RFC 791[] 1122 IP IP 
IP IP 
IP IP 
Net/3 9-1 [] IP 0 
H H 40 
k— ip h1x40 — o 


(200 0) . (0-40[] 0) 
(«90 600 D ————— — ——» 
091 9000000 0-400 d D IPOD 






















































































































































































































































































































































































92 0000 
IP C 9-2 
U [] U Ë 
netinet/ip.h ip timestamp[][] 
netinet/ip var.h ipoption[][] 
netinet/ip input.c 0000 
netinet/ip_output.c ip insertoptions[][] 
092 UD TDD D 0 
9.2.1 HHH 
9-3 (reversal) 
[] U D 0 0 D 0 E 
ip_nhops | int 00000000 
ip srcrt | struct ip srcrt | 000000 

















qe 000000000 
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9.2.2 
[| ipstatl] [] ips. badoptions[] 8-4 
9.3 0000 
IP 0 UI LU U U | | 9-4 
| | 
k— len] O — +>] 
100 000 | type | e [ae data 
P di Tis 000000000000 
~~. 000000 - 
me] = 
1 2 bit 5 bit 
094 JO00000P00000 
1 (type) 
(len) (data) 1 
(offset)U] O U 
1 bit (copied) 2 bit[] (class) 5 bit 
(number) 9-5 IP 









































































































































































































































O O (EOL) 
OP) 


ENEE 
Zi 















































































































































































































































































































































































































































































































































0-00-00111 [] [] 
0-10-00100 [] [] 
IPOPT SECURITY š 1-00-00010 1 OOO 
IPOPT_LSRR E 1-00-00011 O 000000000 (LSRR) 
1-00-00101 O Uum 
IPOPT SATID -0- 1-00-01000 4 000 
IPOPT SSRR - 1-00-01001 O O 0200000000 (SSRR) 
09-5 REC 7910 00 PO O 
1 Net/3 2 3 class O 0 
4 Net/3 Net/3 0 00 
ip_dooptions IP 1 UD 
Net/3 ID] D ID 2 (00000 
ITT RFC 791 : Ed 
[] 9-6 IP[] ODD 
Net/3 (10.40) class [J 
copied IP class | 
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2 
9-6 9-5 class|] 2 class[] 0 
9.4 ip_dooptions[] |] 
8-13 ipintr ip_dooptions 
ip_dooptions m ip_dooptions 
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cp[IPOPT_OPTVAL] 


























Cp[IPOPT OLEN] 


Cp[IPOPT OFFSET] 





type | len | offset 


ip dooptions 
1 ip_dooptions 0 ipintr 
ip_dooptions for 
cp 9-7 cp 
typel] length|] offset 


data 








» 
i 


Jer 10090000000 









































len] O ——P 























































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































RFC (offset) (pointer) offset 
(U type 1) type 
4(IPOPT MINOFF), 
9-8 ip dooptions 
555-566 ip dooptions[] ICMP type ICMP PARAMPROB 
ICMP_PARAMPROB|| code 
ICMP 
ip 20 ip ip+1 IP 
ip | ip_dooptions IP] O O | 
(u_char) cp IP 
IP 
1. EOL[] NOP 
567-582 for EOL 
( IP! ) NOP 
switch default 
switch ip_dooptions 
switch 
2; 
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719-724 SSRR[] LSRR forward 
ip forward 2 1 
Se tp. input.c 
554 ip dooptions (m) 
555 struct mbuf *m; 
556 ( 
557 struct ip *ip = mtod(m, struct ip *); 
558 u char *cp; 
559 struct ip timestamp *ipt; 
560 struct in ifaddr *ia; 
561 int opt, optlen, cnt, off, code, type = ICMP_PARAMPROB, forward = 0; 
562 struct in addr *sin, dst; 
563 n time ntime; 
564 dst - ip-»ip dst; 
565 cp = (u char *) (ip + 1); 
566 cnt - (ip-»ip hl «« 2) - sizeof(struct ip); 
567 for (; ent > 0; cnt -- optlen, cp += optlen) { 
568 opt = cp[IPOPT_OPTVAL]; 
569 if (opt == IPOPT_EOL) 
570 break; 
571 if (opt == IPOPT_NOP) 
572 optlen = 1; 
573 else { 
574 optlen = cp[IPOPT_OLEN]; 
575 if (optlen <= 0 || optlen > cnt) ( 
576 code = &cp[IPOPT_OLEN] - (u char *) ip; 
577 goto bad; 
578 } 
579 } 
580 switch (opt) { 
581 default: 
582 break; 
719 } 
720 if (forward) { 
721 ip_forward(m, 1); 
722 return (1); 
723 } 
724 return (0); 
725 bad: 
726 ip->ip_len -= ip->ip_hl << 2; /* XXX icmp error adds in hdr length */ 
727 icmp_error (m, type, code, 0, 0); 
728 ipstat.ips badoptions++; 
729 return (1); 
730 } 





ip input.c 


[] 9-8 ip dooptions JJ J 











8.5 ICMP — 


ip_forward 2 
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III] 







































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































ip_dooptions 1 0 
ipintr 
(ipforwarding 1) 
RFC 1122 
RFC 1127 [Braden 1989c] 
3. 
725-730 switch ip_dooptions bad 
IP icmp error icmp error 
ip_dooptions 1 ipintr 
Net/3 
95 000000 
IP 
40 3 ( 4 
90 (31 4x 9[] 39) 
9-9 9-10 
KS mee address 1 address2 1 address n 
7 4 (offset = 4) (0fset-8) | (offset = 4n) 
1 1 1 
400 400 400 


099 OO0O000000-00=9 


ip_input.c 
647 case IPOPT_RR: 
648 if ( (off = cp[IPOPT OFFSET]) < IPOPT MINOFF) ( 
649 code = &cp[IPOPT OFFSET] - (u char *) ip; 
650 goto bad; 
651 ) 
652 /* 
653 * If no space remains, ignore. 
654 * 
655 off--; /* 0 origin */ 
656 if (off > optlen - sizeof(struct in addr)) 
657 break; 
658 bcopy((caddr t) (&ip->ip_dst), (caddr t) € ipaddr.sin addr, 
659 sizeof(ipaddr.sin addr)); 
660 /* 
661 * locate outgoing interface; if we're the destination, 
662 * use the incoming interface (should be same). 
663 */ | 
664 if (lia = (INA) ifa_ifwithaddr((SA) & ipaddr)) == 0 && 
665 (ia = ip_rtaddr (ipaddr.sin_addr)) == 0) { 
666 type = ICMP_UNREACH; 
667 code = ICMP UNREACH, HOST; 


09-10 [] ip options U 0000000 0 U 
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668 goto bad; 
669 } 
670 bcopy((caddr t) & (IA_SIN(ia)->sin_addr), 
671 (caddr_t) (cp + off), sizeof(struct in_addr)); 
672 cp[IPOPT_OFFSET] += sizeof(struct in_addr); 
k; una 
673 brea. ip_input.c 
19-14 (11) 
647-657 ip_dooptions ICMP 
code bad (U 9-8) 
ICMP code 
658-673 ip_dst ( ) 
ip_rtaddr 
ip_rtaddr ICMP 
1[] 7.3 
ip rtaddr 
ip rtaddr IP 
in ifaddr 9-11 
— ip input.c 
735 struct in ifaddr * 
736 ip_rtaddr (dst) 
737 struct in_addr dst; 
738 I 
739 struct sockaddr in *sin; 
740 sin = (struct sockaddr in *) &ipforward_rt.ro_dst; 
741 if (ipforward_rt.ro_rt == || dst.s_addr != sin->sin_addr.s_addr) { 
742 if (ipforward_rt.ro_rt) { 
743 RTFREE (ipforward_rt.ro_rt); 
744 ipforward_rt.ro_rt = 0; 
745 } 
746 sin->sin_family = AF_INET; 
747 sin->sin_len = sizeof(*sin); 
748 sin->sin_addr = dst; 
749 rtalloc (&ipforward_rt); 
750 } 
751 if (ipforward_rt.ro_rt == 0) 
752 return ((struct in ifaddr *) 0); 
753 return ((struct in ifaddr *) ipforward rt.ro rt->rt ifa); 


754 ) NS 
MM IH input. 


09-11 OD iprtadr D D U OD D 0 U 





1. IP 
735-741 ip_rtaddr dest 
























































































































































































































































202 uu n: China-bubsco 
— COT 














































































































































































































































































































































































































2: 
742-750 ( ) sini 
ro dst W rtalloc 

3. 
751-754 





































































































































































































































































































96 000000000 

































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































9-12 
AI BO C HS[] HD IP 
A AO As] A; BOC 9-13 
09-12 D DDD U 
— =E 
4 offset address 1 address 2 address n 
(offset = 4) (offset = 8) (offset = 4n) 
1 1 1 400 400 400 
09-13 2000000009 
IP 
9-14 HS[] AI BO CO HD 
1 
HD 9-15 
A; A, 



































































































































































































































































































































































































































































































































UDP[] Net/3 
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ibn 
IE 





























. em C HD | = HD 
Fi = A e° C, HD 
B a Å» B, ° = 
C A, Ba 





RENE mye] am av 


usa DOOO00GG000000000000 





583 p ip input.c 
584 * Source routing with record. 
585 * Find interface with current destination address. 
586 * If none on this machine then drop if strictly routed, 
587 * or do nothing if loosely routed. 
588 * Record interface address and bring up next address 
589 * component. If strictly routed make sure next 
590 * address is on directly accessible net. 
591 * 
592 case IPOPT LSRR: 
593 case IPOPT SSRR: 
594 if ((off = cp[IPOPT_OFFSET]) < IPOPT_MINOFF) { 
595 code = &cp[IPOPT_OFFSET] - (u_char *) ip; 
596 goto bad; 
597 } 
598 ipaddr.sin_addr = ip->ip_dst; 
599 ia = (struct in_ifaddr *) 
600 ifa_ifwithaddr ( (struct sockaddr +) &ipaddr) ; 
601 if (ia == 0) { 
602 if (opt == IPOPT_SSRR) { 
603 type = ICMP_UNREACH; 
604 code = ICMP_UNREACH_SRCFAIL; 
605 goto bad; 
606 } 
607 /* 
608 * Loose routing, and not at next destination 
609 * yet; nothing to do except forward. 
610 */ 
611 break; 
‚ 612 ) 
613 off--; /* 0 origin */ 
614 if (off » optlen - sizeof(struct in addr)) ( 
615 /* 
616 * End of source route. Should be for us. 
617 */ 
618 save rte(cp, ip-»ip src); ] 
619 break; 
620 } 
621 /* 
622 * locate outgoing interface 
623 */ 
624 bcopy((caddr t) (cp + off), (caddr_t) & ipaddr.sin_addr, 
625 sizeof (ipaddr.sin_addr)); 
626 A if (opt == IPOPT_SSRR) { 


627 #define INA struct in_ifaddr * 
628 #define SA struct sockaddr * 
629 if ((ia = (INA) ifa ifwithdstaddr((SA) & ipaddr)) == 0) 


09-15 [] U ip dooptions [| LSRR[] SSRR OOO 
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TCP/IP 2 
630 ia = (INA) ifa_ifwithnet((SA) & ipaddr); 
631 } else 
632 ia = ip rtaddr(ipaddr.sin addr); 
633 if (ia == 0) ( 
634 type = ICMP UNREACH; 
635 code = ICMP UNREACH SRCFAIL; 
636 goto bad; 
637 ) 
638 ip->ip dst = ipaddr.sin addr; . 
639 bcopy((caddr t) & (IA SIN(ia)-»sin addr), 
640 (caddr t) (cp + off), sizeof(struct in addr)); 
641 Cp[IPOPT OFFSET] += sizeof(struct in, addr); 
642 /* 
643 * Let ip_intr’s mcast routing check handle mcast pkts 
644 */ 
645 forward = !IN_MULTICAST (ntohl (ip->ip_dst.s_addr)); 
646 break; "C 
tp input.c 
1.915 (U) 
583-612 A(IPOPT MINOFF) Net/3 ICMP| 
cod 
(IPOPT. SSRR) 
(IPOPT LSRR) IP 
1. 
613-620 off IP ip_dst 
off 
save_rte ip srert ip nhops([] 9-18) 
ip srert ip input.e 
2. 
621-637 ip_dst offset 
ifa_ifwithdst|| ifa_ifwithnet 
) ( ) 
ip rtaddr([] 9-11) 
ICMP 
638-644 ip dooptions[| ip dst off 
IP 
3. 
645-646 forward 1 
ipintr 
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1[] 8.5 





































































































9.6.1 save rte 

























































































































































































































































































































































































RFC 1122 
9-18 save rte 
9-16 ip srert 

- - ip i ; 
57 int ip_nhops = 0; p_Input.c 
58 static struct ip srcrt { 
59 struct in_addr dst; /* final destination */ 
60 char nop; /* one NOP to align */ 
61 char srcopt[IPOPT_OFFSET + 1]; /* OPTVAL, OLEN and OFFSET */ 
62 struct in_addr route[MAX_IPOPTLEN / sizeof(struct in_addr)]; 


63 } ip_srcrt; re 
— n I INOUE 


[ 9-16 [] Ú ip srcrt 

















































































































































































































































































































































































































Route 
Struct in addr route[(MAX IPOPTLEN - 3)/sizeof (struct in addr)]; 
9-26 9-27 
57-63 ip srcrt ` ip srert 
ip srcrt[| save rte ip srert ip srcroute 
9-17 










































































































































































0000 


ip_dooptions 





09-17 po000000000 





SE ip input.c 
760 save rte(option, dst) 
761 u char *option; 
762 struct in addr dst; 
763 { 
764 unsigned olen; 
765 olen = option [IPOPT OLEN]; 
766 if (olen > sizeof(ip_srcrt) - (1 + sizeof(dst))) 
767 return; 
768 bcopy((caddr t) option, (caddr t) ip srcrt.srcopt, olen); 
769 ip nhops = (olen - IPOPT OFFSET - 1) / sizeof(struct in addr); 
770 ip srcrt.dst = dst; 
771 ) ul å 
ip input.c 





U 9-18 UU save rte 
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759-771 ip dooptions save rte 
option dst ip src ( 
9-12 HS) ip_srcrt save_rte 
ip srert (40 ) 
save rte ip srert ip nhops 
dst 
9.6.2 ip sreroute 
ICMP 
ip srcroute 9-19 
ip input.c 

777 struct mbuf * ER 

778 ip sreroute() 

779 I 

780 struct in addr *p, *q; 

781 struct mbuf *m; 

782 if (ip nhops == 0) 

783 return ((struct mbuf *) 0); 

784 m = m get (M DONTWAIT, MT SOOPTS); 

785 if (m == 0) i 

786 return ((struct mbuf +) 0); 

787 #define OPTSIZ (sizeof(ip srcrt.nop) + sizeof (ip srcrt.srcopt)) 

788 /* length is (nhops+1)*sizeof(addr) + sizeof(nop + srcrt header) */ 

789 m->m_len = ip nhops * sizeof (struct in addr) + sizeof(struct in addr) + 

790 OPTSIZ; 

791 /* 

792 * First save first hop for return route 

793 * 

794 p = &ip srcrt.route[ip nhops - 1]; 

795 *(mtod(m, struct in_addr *)) = *p--; 

796 /* 

797 * Copy option fields and padding (nop) to mbuf. 

798 */ 

799 ip_srcrt.nop = IPOPT_NOP; 

800 ip.srcrt.srcopt[IPOPT OFFSET] = IPOPT MINOFF; 

801 bcopy((caddr t) & ip srcrt.nop, 

802 mtod(m, caddr t) + sizeof(struct in addr), OPTSIZ); 

803 q = (struct in_addr +) (mtod(m, caddr t) + 

804 sizeof (struct in addr) + OPTSIZ); 

805 #undef OPTSIZ 

806 Zë 

807 * Record return path as an IP source route, 

808 * reversing the path (pointers are now aligned). 

809 */ 

810 while (p >= ip srcrt.route) { 

811 *q++ = *p--; 

812 ) 

813 /* 

814 * Last hop goes to final destination. 


[] 9-19 


ip srcroute [0 
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815 */ 
816 *q = ip srert.dst; 
817 return (m); 
818 } 
ip input.c 
09-19 (U) 
777-783 ip sreroute ip srert ipoption 
(U 9-26) ip nhops[1 0 
ip sreroute 
8-13 ipintr[] ip nhops 
ip srcroute 
ipintr IP 
(TCP[] UDP) 
784-786 ip nhops[] O[] ip srcroute mbu m len 
(OPTSIZ) 
p ip srcroute mbu 
NOP ( 9.4) 
mbu 
805-818 While IP mbu 
save rte ip srcrt.dst 
mbuf| 9-20 9-12 
. nop (IPOPT NOP) 
ip nhops: 3 
_ srcopt [0] (TPOPT_SSRR) 
400 srcopt [1] (option-length) 


srcopt [2] (option-offset) 












route[0] route[1] route[2] route[3-9] 


dst 
«Pa PES T m [ ses 36] 
k— D0000 | —4 


O 9-20 ip srcroute [| [| ip srcrt JO Ú Ú 








97 00000 






























































































































































UTC 32 bit 


















































































































































































































































































































































































































































208 un n: China+pub.tom 
Saree... s 








































































































































































































































































































































































































Net/3 9-22 ip_timestamp 
114-133 ip (O 8-10) #ifs 9-21 
ipt_flg 
ipt_flg U 0 [] 

IPOOPT TS TSONLY 0 00000 

IPOPT TS TSANDADDR 1 0200000090 
2 oO 

IPOPT_TS_PRESPEC 3 pogo 00000000 
4-15 DO 

09-21 ¿ipe flg [ D D DÚ 








—— ip.h 
114 struct ip timestamp ( 
115 u_char ipt code; /* IPOPT TS */ 
116 u char ipt len; /* size of structure (variable) */ 
117 u char ipt ptr; /* index of current entry */ 
118 #if BYTE ORDER -- LITTLE ENDIAN . 
119 u_char ipt_flg:4, /* flags, see below */ 
120 ipt_oflw: 4; /* overflow counter */ 
121 #endif 
122 #if BYTE_ORDER == BIG_ENDIAN 
123 u_char ipt_oflw:4, /* overflow counter */ 
124 ipt flg:4; /* flags, see below */ 
125 fendif 
126 'union ipt timestamp ( 
127 n long ipt time[1]; 
128 struct ipt ta ( 
129 struct in addr ipt, addr; 
130 n long ipt, time; 
131 ) ipt ta[1]; 
132 ) ipt timestamp; 
133 ); A 
ip.h 


09-22 ip timestamp D0000 













































































































































































































































































































































































ipt_flgl] 3 








































































































oflw 
flg 


1 tr time[1] time[2] 
en|p (ptr = 4) (ptr = 8) 
len|ptr 1 ta[1].addr | ta[1].time 
p (ptr = 4) (ptr =8) 
len|ptr 3 ta[1].addr | ta[1] .time taln] .addr | taln] .time 
p (ptr = 4) (ptr = 8) (ptr = 8n-4) (ptr = 8n) 
T l amu 400 










time [n-2] time [n-1] time[n] 
(ptr =4n-8) | (ptr=4n-4) | (ptr=4n) 
ta [n] .addr | ta [1] .time 
(ptr=8n4) | (ptr=8n) 












400 400 
[9-23 Dm HH HE 00) 
IP 40 9 (ipt. flg[l[] OG 4 
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(ipt flg 1[] 3) 9-24 
674-684 5 ( ) ip_dooptions 
ICMP oflw 
oflw[] 1 16( 4 bit ) ICMP 
ip_input.c 
674 case IPOPT_TS: 
675 code = cp - (u_char *) ip; 
676 ipt = (struct ip_timestamp *) cp; 
677 if (ipt->ipt_len < 5) 
678 goto bad; 
679 if (ipt->ipt_ptr > ipt->ipt_len - sizeof(long)) { 
680 if (++ipt->ipt_oflw == 0) 
681 goto bad; 
682 break; 
683 } 
684 sin = (struct in_addr *) (cp + ipt->ipt_ptr - 1); 
685 switch (ipt->ipt flg) { 
686 case IPOPT_TS_TSONLY: 
687 break; 
688 case IPOPT_TS_TSANDADDR: . 
689 if (ipt->ipt_ptr + sizeof(n_time) + 
690 sizeof (struct in_addr) > ipt->ipt len) 
691 goto bad; 
692 ipaddr.sin_addr = dst; 
693 ia = (INA) ifaof ifpforaddr((SA) & ipaddr, 
694 m->m_pkthär.rcvif); 
695 if (ia == 0) 
696 continue; 
697 beopy((caddr_t) & IA SIN(ia)->sin addr, 
698 (caddr t) sin, sizeof(struct in addr)); 
699 ipt-»ipt ptr += sizeof(struct in addr); 
700 break; 
701 case IPOPT TS PRESPEC: 
702 if (ipt-»ipt ptr + sizeof(n time) + 
703 Sizeof(struct in addr) > ipt->ipt len) 
704 goto bad; 
705 bcopy((caddr t) sin, (caddr t) & ipaddr.sin addr, 
706 sizeof(struct in addr)); 
707 if (ifa ifwithaddr((SA) & ipaddr) -- 0) 
708 continue; 
709 ipt-»ipt ptr += sizeof(struct in_addr); 
710 break; 
711 default: 
712 goto bad; 
713 ) 
714 ntime - iptime(); 
715 bcopy((caddr t) & ntime, (caddr t) cp + ipt-»ipt ptr - 1, 
716 sizeof (n time)); 
717 ipt->ipt ptr += sizeof(n time); 
718 } 
719 } 


— —m__S¿SAKr—) IH IDM 


09-24 [][] ip dooptions DDDODUOUODU 
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1. 
685-687 ipt_flgl 0 (IPOPT_TS_TSONLY) switch 
2. 
688-700 ipt flg[]! (IPOPT TS TSANDADDR) 
( ) Net/3 IP 
ip dooptions ifaof ifpforaddr ( 
00) U U U (INA 
SAN 0009-1500) 
ER [l 
701-710 ipt_flg[] 3 (IPOPT_TS_PRESPEC)] ifa_ifwithaddr 
continuell ip dooptions 
switch 
4. 
711-713 default ipt_flg bad 
714-719 | switch[] | iptime UTC 
ip dooptions 
iptime 
9-25 iptime 
458 n time ip_iemp.c 
459 iptime() 
460 ( 
461 struct timeval atv; 
462 u long t; 
463 microtime (&atv); . 
464 t = (atv.tv_sec % (24 * 60 * 60)) * 1000 + atv.tv_usec / 1000; 
465 return (htonl(t)); 
466 ) SR 
ip_icmp.c 
09-25 DUU iptime 
458-466 microtime UTC1970[] 1[] 1 timeval 
| LU atv 
11 7.4 | 
9.8 ip insertoptions[]|[] 
8.6 ip output ip forward 
ip forward ip output 
ip insertoptions( 8-22 ip output ) 






























































































































































ip forward 
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ip insertoptions ipoption 9-26 

92 struct ipoption ( ip var.h 

93 struct in addr ipopt dst; /* first-hop dst if source routed */ 

94 char ipopt list[MAX IPOPTLEN]; /* options proper */ 

95 Y; 

ip_var.h 
[] 9-26 []  ipoption 

92-95 ipopt_dst 

ipopt_list 40(MAX_IPOPTLEN) 

ipopt_dst 0 
ip srert (U 9-16) ip_srcroute([] 9-19) mbuf 

ipoption 9-27 ip srcrt[] ipoption 

































































































































srcopt [0] 
srcopt [1] 
srcopt [2] 


ip srcrt() 





" : ipopt- N 
ipoption() ipopt list[40] 


09-27 DD ip srcrt [| ipoption 


a 



















































































































































































































































































































































































ip srcrt[] ipoption[] 4 (route[9]) 
44 IP 
(O 9-16) 
ip insertoptions 9-28 
ip output.c 


352 static struct mbuf * 

353 ip insertoptions(m, opt, phlen) 
354 struct mbuf *m; 

355 struct mbuf *opt; 

356 int *phlen; 


357 ( 

358 struct ipoption *p = mtod(opt, struct ipoption *); 
359 struct mbuf *n; 

360 struct ip *ip = mtod(m, struct ip *); 

361 unsigned optlen; 

362 optlen = opt->m len - sizeof(p->ipopt dst); 

363 if (optlen + (u short) ip->ip len > IP MAXPACKET) 
364 return (m); /* XXX should fail */ 
365 if (p->ipopt det. e addr) 

366 ip->ip dst = p->ipopt dst; 

367 if (m->m flags & M EXT || m->m data - optlen < m-»m pktdat) ( 
368 MGETHDR (n, M, DONTWAIT, MT HEADER); 

369 if (n == 0) 


O 9-28 [] [| ip insertoptions 


212 














China=pub.com 


TCP/IP 2 



































































































































































































































































































































































































































































































































































































































370 return (m); 
371 n->m pkthdr.len = m->m_pkthär.len + optlen; 
372 m->m_len -= sizeof(struct ip); 
373 m->m data += sizeof(struct ip); 
374 n->m next = m; 
375 m = n; 
376 m->m len = optlen + sizeof(struct ip); 
377 m->m data += max linkhdr; 
378 bcopy((caddr t) ip, mtod(m, caddr t), sizeof(struct ip)); 
379 ) else ( 
380 m-»m data -- optlen; 
381 m-»m len += optlen; 
382 m-»m pkthdr.len 4- optlen; . 
383 ovbcopy((caddr t) ip, mtod(m, caddr t), sizeof(struct ip)); 
384 } 
385 ip = mtod(m, struct ip *); 
386 bcopy((caddr t) p->ipopt list, (caddr t) (ip + 1), (unsigned) optlen); 
387 *phlen - sizeof(struct ip) * optlen; 
388 ip->ip len += optlen; 
389 return (m); 
390 } A 
ip output.c 
U 9-28 (0) 
352-364 ip insertoptions m opt 
phlen ( ) 
65 535(IP MAXPACKET) 
ip dooptions ip insertoptions 
mbuf () 
(200 0 ) 
(80 D) 
E = m_pktdat 
000000 
000 


m_data 
IP] O 
(200 0 ) 
TCPO O 
1000 D (200 I) 


440 0 





09-29 [][ ip insertoptions [ TCP] [I [] 
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365-366 ipopt_dst.s_addr 
ip_dst 
26.2 TCP MGETHDR[] IP[] TCP mbu 9-29 

367-378 TCP mbu 

mbuf() 
m 00000000 
200 0 200 0 
80 O 
m data PETE EE EE ANA ip 
Pog bcopy 
(200 0) 
ne Es 
TCPO [] 

PO O (200 0 ) 





(optlen[][]) 




























































































































































































































































































[] 9-30 DO ip insertoptions 9000000000 TCPO O Ú 


mbuf{} 


m_pktdat 


m_data 





0 9-31 [| [| ip_insertoptions  [] UDPT] IL 





214 
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TCP/IP 2 
16 367 MGETHDR 
mbuf] 9-30 mbu 
367-378 
ip insertoptions mbu IP 
23.6 UDP M_PREPEND[] UDP[] IP 
9-31 UDP 
367 
379-384 m data[| m len 
optlen IP ovbcopy( 
) 
385-390 ip insertoptions ipoption ipopt list 
IP *phlen 
(ip len) 
9.9 ip pcbopts[|[]| 
ip. pcbopts[] IP IP OPTIONS ip output 
ipoption 9-32 
ip output.c 
559 int p-outp 
560 ip pcbopts (pcbopt, m) 
561 struct mbuf **pcbopt; 
562 struct mbuf *m; 
563 ( 
564 cnt, optlen; 
565 u char *cp; 
566 u char opt; 
567 /* turn off any old options */ 
568 if (*pcbopt) 
569 (void) m free(*pcbopt); 
570 *pcbopt - 0; 
571 if (m == (struct mbuf *) 0 || m->m len == 0) ( 
572 /* 
573 * Only turning off any previous options. 
574 */ 
575 if (m) 
576 (void) m free (m); 
577 return (0); 
578 ) s 
579 if (m->m len $ sizeof(long)) 
580 goto bad; 
581 /* 
582 * IP first-hop destination address will be stored before 
583 * actual options; move other options back 
584 * and clear it when none present. 
585 */ 
586 if (m-»m data 4 m-»m len 4 sizeof(struct in addr) »- &m-»m dat[MLEN]) 
587 goto bad; 
588 cnt = m-»m len; 
589 m-»m len += sizeof(struct in addr); 


[] 9-32 [O [| ip pcbopts 








Chinaspubecom SCH 215 












































590 cp = mtod(m, u char +) + sizeof(struct in_addr); 

591 ovbcopy (mt od (m, caddr t), (caddr_t) cp, (unsigned) cnt); 
592 bzero (mtod(m, caddr t), sizeof(struct in addr)); 

593 for (; cnt > 0; cnt -= optlen, cp += optlen) ( 

594 opt = cp[IPOPT_OPTVAL]; 

595 if (opt == IPOPT_EOL) 

596 break; 

597 if (opt == IPOPT_NOP) 

598 optlen = 1; 

599 else { 

600 optlen = cp[IPOPT OLEN]; 

601 if (optlen <= IPOPT_OLEN || optlen > cnt) 

602 goto bad; 

603 } 

604 switch (opt) { 

605 default: 

606 break; 

607 case IPOPT_LSRR: 

608 case IPOPT_SSRR: 

609 /* 

610 * user process specifies route as: 

611 * ->A->B->C->D 

612 * D must be our final destination (but we can't 
613 * check that since we may not have connected yet). 
614 * A is first hop destination, which doesn't appear in 
615 * actual IP option, but is stored before the options. 
616 */ 

617 if (optlen < IPOPT MINOFF - 1 + sizeof(struct in_addr)) 
618 goto bad; 

619 m-»m len -= sizeof (struct in addr); 

620 cnt -= sizeof(struct in addr); 

621 optlen -= sizeof (struct in addr); 

622 cp[IPOPT_OLEN] = optlen; 

623 /* 

624 * Move first hop before start of options. 

625 */ 

626 bcopy((caddr t) & cp[IPOPT OFFSET + 1], mtod(m, caddr t), 
627 sizeof (struct in addr)); 

628 /* 

629 * Then copy rest of options back 

630 * to close up the deleted entry. 

631 XI 

632 ovbcopy ( (caddr_t) (&cp[IPOPT OFFSET + 1] + 

633 sizeof (struct in addr)), 

634 (caddr t) & cp[IPOPT OFFSET + 1], 
635 (unsigned) cnt + sizeof (struct in addr)); 
636 break; 

637 } 

638 1 

639 if (m->m_len > MAK IPOPTLEN + sizeof(struct in_addr)) 

640 goto bad; 

641 *pcbopt = m; 

642 return (0); 

643 bad: 

644 (void) m_free(m); 

645 return (EINVAL); 

646 ) 





ip_output.c 


09-32 (0) 


216 
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TCP/IP 2 
559-562 pcbopt 
m 
IP_OPTIONS LSRR SRR 
IP 
9-14 
1. 
563-580 m_free|| *pcbopt 
4 bit ip_pcbopts bad 
EINVAL 
ipoption 9-33 
uu 











U 9-33 ip pcboets 00000 




























































































































































































































































































































































































































































































































































































































































































































































































































































































































































































2. 
581-592 4 
in addr JU ovbcopy bzero 4 
3. 
593-606 or LSRR[] SSRR 
4. LSRR[] SSRR 
607-638 LSRR[] SSRR 
4 
bcopy ovbcopy 4 
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5. 
639-646 ( ) 44 (MAX_IPOPTLEN +4) 
IP *pcbopt 
9.10 IDOL 
IP 1 
pingl] traceroute IP 
Telnet[] FTP 
IP 
40 
IPv6 
IP 
(10.6[] ) 
9.11 DD 
IP ID Net/3 
40 IP 
save_rte ip_srcroute 
RFC 1122 
Net/3 
ip_insertoptions 
U U 
9.1 
9.2 IP 
9.3 
9.4 NOP 9-16 ip srert 
9.5 
9.6 ip dooptions dest[] ([] 9-8) 


































































































































































































U 100 


Chinas pub cM 


POD00060 



























































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































10.1 OQ 
8 IP 
IP 
IP 
IP 
IP IP 
8-5 0.3%(72 786/27 881 978) 0.12% (264 484/ 
(29 447 726-796 084)) world.std.com 
9.5% world NFS IP 
IP (ip_id) (ip off[] 3 
) (ip off] 13 ) I bit 0 
0 10 * ” (DF) 2[] " " (MF) Net/3 
ip off 10-1 
ip off o pris U 0 0 U 
111 
130 O 
D) 10-1 ip off DD IPL D D D D 
Net/3 IP_DF[] IP MF ip_off DF[] MF[] IP 
DF 
UDP[] TCP Net/3 DF 
IP ( 320 ) IP 
DF TCP| u MTU (path MTU discovery)” 
ip_off 13 bit 8 
8 8 
10-2 IP 
(ip off 13 bit) 
10-2 IP 8190 3 
8 MF 






















































































































































































































































































Chinaspubecom SCH 219 
























































00000... — ——.- — 


0 78 15 16 23 24 65511 Sia 
E | | L lS 
ip off=0 MF-0 
: soo : 80D : 800 : : 800 :3: 
: : : DU 
















































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































200 0 : ; 
mom | | 
ip_off=0 MF=1 
200 D sog ` : 
META JI ` 
200 D soo: : 
ip_off=2 MF=1 
200 O : 80 O U = 
| 
ip off=8188 MF-1 : 
200 Ú soo: : 
PO O E 
ip_off=8189 MF=0 
200 0 30 0 
0 10-2 655350 00000000 
(ip off) 
65514 
65535 — ip_len ip_off 
8189(8189x 8265512) 3 IP 
IP 
ip_id 
(ip_src) (ip_dst) (ip_p) 
ip_id 
ip_id ip_off 
MF 
10.2 TON 
D U U D C 
10-3 





















































netinet/ip_var.h 000000 


netinet/ip_output.c 0000 
netinet/ip_input.c 0000 


0103 0000000 





220 
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TCP/IP [l-2 
10.2.1 | 
ipq 10-4 
U U U Ë 0 E 
ipq struct ipq *| 000 
[] 10-4 [00000000 
10.2.2 D 
10-5| 8-4[] ipstatl] 
T = 
ipstat[] [| [] 
ips cantfrag U DD DDD DEO D D 00000000000 
ips_odropped D D 000000000000 
ips ofragments 0000000 
ips_fragmented | 000000000 
010-5 Dd d B a D D U 
10.3 DD 
ip output 8-25 
MTU 
. (O 10-6) 
. (O 10-7) 
. ( 10-8) 
5 = ip output.c 
254 * Too large for interface; fragment if possible. 
255 * Must be able to put at least 8 bytes per fragment. 
256 Sy 
257 if (ip->ip off & IP DF) { 
258 error = EMSGSIZE; 
259 ipstat.ips_cantfrag++; 
260 goto bad; 
261 3 
262 len = (ifp->if mtu - hlen) & ^7; 
263 if (len < 8) { 
264 error = EMSGSIZE; 
265 goto bad; 
266 } . 
ip output.c 
U 10-6 QQ ip output [1l U0 0 0 D 
253-261 [] mbu 0 DF 































































































































































































Chi a-bubıcoN 100 IP 



























































221 

























































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































ip_output EMSGSIZE 
ip_forward ICMP 
(O 8-21) 
Net/3 Ñ MTU " 
1[] 11.8 24.2 UDP[] TCP MTU 
262-266 len MTU 
3 (& 7) 8 MTU 8 
ip output EMSGSIZE 
IP| len 

10-7 C 2 

(O 10-8) 
ip output.c 

267 { p-outpu 
268 int mhlen, firstlen - len; 
269 struct mbuf **mnext - &m-»m nextpkt; 
270 /* 
271 * Loop through length of segment after first fragment, 
272 * make new header and copy data of each part and link onto chain. 
273 Ef 
274 m0 = m; 
275 mhlen = sizeof (struct ip); 
276 for (off = hlen + len; off < (u short) ip->ip_len; off += len) { 
277 MGETHDR (m, M_DONTWAIT, MT_HEADER); 
278 if (m == 0) { 
279 error = ENOBUFS; 
280 ipstat.ips odropped++; 
281 goto sendorfree; 
282 } 
283 m->m_data += max linkhdr; 
284 mhip = mtod(m, struct ip *); 
285 *mhip = *ip; 
286 if (hlen > sizeof(struct ip)) ( 
287 mhlen = ip optcopy (ip, mhip) + sizeof(struct ip); 
288 mhip->ip_hl = mhlen >> 2; 
289 } 
290 m->m_len = mhlen; 
291 mhip->ip_off = ((off - hlen) >> 3) + (ip->ip off & ^IP MF); 
292 if (ip->ip_off & IP MF) 
293 mhip->ip off |= IP MF; 
294 if (off + len >= (u short) ip-»ip len) 
295 len = (u short) ip->ip len - off; 
296 else š 
297 mhip->ip_off |= IP MF; 
298 mhip->ip_len = htons((u_short) (len + mhlen)); 
299 m->m_next = m copy(m0, off, len); 
300 if (m->m_next == 0) ( 
301 (void) m_free(m); 
302 error = ENOBUFS; /* ??? */ 
303 ipstat.ips_odropped++; 
304 goto sendorfree; 
305 } 
306 m->m pkthdr.len = mhlen + len; 


0 10-7 QQ ip output UUUUUU 











222 


TCP/IP 
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307 m->m_pkthdr.rcvif = (struct ifnet +) 0; 
308 mhip->ip_off = htons((u_short) mhip->ip_off); 
309 mhip->ip_sum = 0; 
310 mhip->ip_sum = in_cksum(m, mhlen); 
311 *mnext = m; 
312 mnext = &m->m_nextpkt; 
313 ipstat.ips_ofragments++; 
314 } 
ip_output.c 
U 10-7. (0) 
ip output.c 
315 /* p_outp 
316 * Update first fragment by trimming what’s been copied out 
317 * and updating header, then send each fragment (in order). 
318 */ 
319 m = m0; 
320 m_adj(m, hlen + firstlen - (u_short) ip->ip_len); 
321 m->m pkthdr.len = hlen + firstlen; 
322 ip->ip_len = htons((u short) m->m_pkthdr.len); 
323 ip->ip off = htons((u short) (ip->ip_off | IP_MF)); 
324 ip->ip_sum = 0; 
325 ip->ip_sum = in_cksum(m, hlen); 
326 sendorfree: 
327 for (m = m0; m; m = m0) { 
328 m0 = m->m_nextpkt; 
329 m->m_nextpkt = 0; 
330 if (error == 0) 
331 error = (*ifp->if_output) (ifp, m, 
332 (struct sockaddr *) dst, ro->ro_rt); 
333 else 
334 m freem(m) ; 
335 } 
336 if (error == 0) 
337 ipstat.ips fragmented++; 
338 } 2 
ip_output.c 
U 10-8 QQ ip output [0000 
267-269 mhlen[| firstlen|| mnext 
270-276 for 2 
hlen+len ip output 
«277-284 m_data 16 
(max_linkhdr) ip_output 
mbu 
e 285-290 IP| IP 
ip optcopy (10.4[] ) 
e 291-297 MF (ip_off) MF 
MF MF 
MF 
° 298 (ip_optcopy ) 
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«299-305 m copy 

























































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































mbufl m_copy ENOBUFS[] sendorfree 
° 306-314 mbu 
ip_off m_nextpkt 
10-8 ip_output 
315-325 MF 
ip_len[] ip off IP 
IP (O 10-28) 
326-338 ip_output 
for error 
10.4 ip_optcopy[] [] 
ip_optcopy([] 10-9) ( ) 
( ) 
ip_output.c 
395 int p_outp 
396 ip_optcopy (ip, jp) 
397 struct ip *ip, *jp; 
398 I 
399 u char *cp, *dp; 
400 int opt, optlen, cnt; 
401 cp = (u char *) (ip + 1); 
402 dp = (u char *) (jp + 1); 
403 ent = (ip->ip hl << 2) - sizeof(struct ip); 
404 for (; ent > 0; ent -= optlen, cp += optlen) { 
405 opt = cp[0]; f 
406 if (opt == IPOPT_EOL) 
407 break; 
408 if (opt == IPOPT_NOP) { 
409 /* Preserve for IP mcast tunnel’s LSRR alignment. */ 
410 *dp++ = IPOPT_NOP; 
411 optlen = 1; 
412 continue; 
413 } else 
414 optlen = cp[IPOPT OLEN]; 
415 /* bogus lengths should have been caught by ip_dooptions */ 
416 if (optlen > cnt) 
417 optlen = cnt; 
418 if (IPOPT COPIED(opt)) { 
419 bcopy((caddr t) cp, (caddr t) dp, (unsigned) optlen); 
420 dp += optlen; 
421 } 
422 } 
423 for (optlen = dp - (u char *) (jp + 1); optlen & 0x3; optlen++) 
424 *dp++ = IPOPT_EOL; 
425 return (optlen); 
426 } I 
ip output.c 


0109 [00000000 






































224 rem 02 China=pubscom 
LAT eena 

























































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































395-422 ip_optcopy ip IP jp 
IP ip optcopy cpl] dp 
cpl] dp for 
EOL NOP 
Net/2 NOP 
IPOPT_COPIED copied ip_optcopy 
9-5 copied 
ip_dooptions 
423-426 20 for] U 4 (ip hlen) 
4 
32 bit 
32 bit 32 bit CPU 32 bit 
CPU 
10-10 ip optcopy 
200 D 120 0 " jy HDD s 
[ms C] w The ans 
200 0 ung 


0109-10 [O00O000000000 















































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































10-10 ip optcopy ( copied 0) 
LSRR ( copied, 1) 4 ip optcopy 
EOL 
105 QQ 
( ) ipintr 
8-15 ipintr ipintr 
ipintr ip_reass 
10-11 ipintr 
271-279 ip_off DF MF MF 
DF 
10-11 else 
280-286 m_pullup mbu | 
IP SLIP (5.30 00 Ú] 
m_devget IP (2.6[] ) mtodl] (2.6[] ) 
















































































































































































Chinaspubecom - 225 













































































































































































m pullup IP mbuf| 
ip_input.c 
271 ours 
272 /* 
273 * If offset or IP_MF are set, must reassemble. 
274 * Otherwise, nothing need be done. 
275 * (We could look in the reassembly queue to see 
276 * if the packet was previously fragmented, 
277 * but it’s not worth the time; just let them time out.) 
278 */ 
279 if (ip-»ip off & "IP DF) { 
280 if (m->m flags & M EXT) { /* XXX */ 
281 if ((m = m pullup(m, sizeof (struct ip))) == 0) { 
282 ipstat.ips_toosmall++; 
283 goto next; 
284 } 
285 ip = mtod(m, struct ip *); 
286 } 
287 pe 
288 * Look for queue of fragments 
289 * of this datagram. 
290 Wi 
291 for (fp = ipq.next; fp != &ipg; fp = fp->next) 
292 if (ip->ip_id == fp->ipg id && I 
293 ip->ip_src.s_addr == fp->ipg src.s addr && 
294 ip->ip_dst.s_addr == fp-»ipq dst.s addr && 
295 ip-»ip p == fp-»ipq p) 
296 goto found; 
297 fp = 0; 
298 found: 
299 /* 
300 * Adjust ip len to not reflect header, 
301 * set ip mff if more fragments are expected, 
302 * convert offset of this to bytes. 
303 */ 
304 ip->ip len -= hlen; 
305 ((struct ipasfrag +) ip)->ipf mff Ke ^1; 
306 if (ip->ip off & IP MF) 
307 ((struct ipasfrag *) ip)->ipf mff |= 1; 
308 ip->ip off <<= 3; 
309 1* 
310 * If datagram marked as having more fragments 
311 * or if this is not the first fragment, i 
312 £ attempt reassembly; if it succeeds, proceed. 
313 */ 
314 if (((struct ipasfrag *) ip)->ipf mff & 1 || ip->ip off) ( 
315 ipstat.ips fragments++; 
316 ip = ip reass((struct ipasfrag *) ip, fp); 
317 if (ip == 0) j 
318 goto next; 
319 ipstat.ips_reassembled++; 
320 m = dtom(ip); 
321 ) else if (fp) 
322 ip_freef (fp); 
323 } else 
324 ip->ip_len -= hlen; ip_input.c 


0 10-11 00 äpintr II 000 


226 


























China 


ub. COM 

































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































TCP/IP 2 
287-297  Net/3 ipq 
“ (Zist)” 
ipintr 4 lip id 
ip src[] ip dst[] ip. p) ipq ipintr 
fp 
Net/3 
298-303 found ipintr 
«304 ipintr ip_len IP 
U ip len g 0 ip_len 
ip_len 
e 305-307 ipintr[] MF ipf_mff ip_tos (Si="1 
) ipf_mff ip ipasfrag 
10.6 10-14 ipasfrag 
RFC 1122 IP 
ip_tos IP ip_tos TOS 
0 ip off( MF ) 
MF 
ip off 16 bit 3 13 bit 
° 308 sl] ip off 8 1 
ipf mff[] ip off ipintr 10-12 
fol] U l! U ip_reass 
309-322 ip_reass U 
ip_reass 
ipintr next ([ 8-12) 
ip_off ipf_mff fp 0 U O O 
0 [] Ë 00000 U 0 0 000 
0 [ U U O0000 OO00000 
U U [ U 0000000 DU D 0 D 00000000 U 
U U [] U U O000000000 U D 0000 DDD DDD 00 0 
U U [ [ O00000000 U D 0000 D U 
U U [ U U O00000000000 | 0O00000000000000 
0 10-12 ipintr [] ip reass [I PI DL] D 
323-324 else 
ip hlen 





























































































































































































































ipintr 











































































































Chinaspubecom - 227 



















































































(U 8-15) 


(*inetsw[ip protox[ip->ip pll.pr input) (m,hlen); 











10.6 ip reass] [J 

































































ipintr ip reass ipq 


























































































































ip reass 

































































































































































































































































ipq 

10-13 

52 struct ipq { pan 

53 Struct ipq *next, *prev; /* to other reass headers */ 

54 u_char ipq ttl; /* time for reass q to live */ 

55 u char ipq p; /* protocol of this fragment */ 

56 u short ipq id; /* sequence id for reassembly */ 

57 Struct ipasfrag tipa next, *ipq prev; 

58 /* to ip headers of fragments */ 

59 struct in_addr ipq src, ipq dst; 

60 y; 


































































































































































































































































































































































































































































































0 10-13 ie D 
52-60 ip idl| ip src|[] ip dat) ip_p 
ipq Net/3[] next[] prev ipg next 
ipq prev 
IP ipasfrag (U 10-14) 
ip, var.h 


66 struct ipasfrag ( 
67 #if BYTE ORDER -- LITTLE ENDIAN 














































































































68 u_char ip hl:4, 
69 ip_v:4; 
70 tendif 
71 #if BYTE_ORDER == BIG_ENDIAN 
72 u_char ip_v:4, 
73 ip_hl:4; 
74 #endif 
75 u_char ipf_nff; /* XXX overlays ip_tos: use low bit 
76 * to avoid destroying tos; 
77 * copied from (ip_off&IP_MF) */ 
78 short ip_len; 
79 u short ip id; 
80 short ip off; 
81 u char ip ttl; 
82 u char ip_p; 
83 u short ip sum; 
84 struct ipasfrag *ipf next; /* next fragment */ 
85 struct ipasfrag *ipf prev; /* previous fragment */ 
86 }; I 
ip var.h 
O 10-14 ipasfrag |] 
66-86 ip_reass ipf next|]ipf prev 
IP ipf mff ip 




















































































































































































































228 


TCP/IP 



























































































































































(ipq) 





























ipasfragt} 


ipf_next 


ipasfrag{} 





(ipasfrag) 





China-pubecom 


















































ipasfrag{} 


-L—— Got prev je 




















































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































000000 
000000 
U 
O 10-15 000000 aea D D D 
10-15 ipd ipq 
ipq next[] prev 
ipq 
10-15 
mbuf ip 
10-16 mbuf[] ipq ipasfrag ip 
10-16 
. mbu 
*ipq next[| prev ipq ipq 
IP (D 10-16 ) 
. ipq ipasfrag 
ipf_next|| ipf prev ipq ipq next||ipq prev 
. ipasfrag ip 
ipasfrag ip 













































































































































































Chinaspubecom - 229 






























































id 






ipq() 





hl l 


= Peer 


D 10-16 O0O0000000000000 


















































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































10-15 10-16 ip_reass 
10-17 ipq 
ipasfrag 
fp 
ipat} 
ipd: 
ipat} 
ip_id=5 
ipasfrag() ipasfrag{} ipasfrag{} 
0 MF 271 544 Mr 814/816 1031 
ipai) 
ip id=6 
ipasfragt} ipasfrag() 
272 ME 543/544 Mr 815 
ipa{} 
ip_id=7 
ipasfrag{} 
816 1031 
U 10-17. D D POOOOOO 
ip id MF MF 
IP 
IP UDP 1024 
1052(20+8+1024) 1500 MTU 
SLIP 
296 SLIP MTU 4 1 
20 IP 8 UDP 264 2 3 20 IP 
272 20 216 (1032-2724 3+216) 
10-17 5 272-543 6 


































































































































































































2 3 0 TCP/IP 






































China-pubecom 












































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































2 
0-271 816 0-815 
10-18 ip_reass IP 
ipintr ip_reass 
ip input.c 
337 /* 
338 + Take incoming datagram fragment and try to 
339 * reassemble it into whole datagram. If a chain for 
340 * reassembly of this datagram already exists, then it 
341 * is given as fp; otherwise have to make a chain. 
342 */ 
343 struct ip * 
344 ip_reass(ip, fp) 
345 struct ipasfrag *ip; 
346 struct ipq *fp; 
347 { 
348 struct mbuf *m = dtom(ip); 
349 struct ipasfrag *q; 
350 struct mbuf *t; 
351 int hien = ip->ip_hl << 2; 
352 int i, next; 
353 FE 
354 * Presence of header sizes in mbufs 
355 £ would confuse code below. 
356 */ 
357 m->m data += hlen; 
358 m->m len -= hlen; 
465 dropfrag: 
466 ipstat.ips fragdropped++; 
467 m_freem(m); 
468 return (0); 
469 } o 
ip input.c 
[] 10-18 0 O ip reass [00000 
343-358 ip_reass ip fp ipq 
ip_reass mbuf[] m data 
m len IP 
465-469 dropfragl| dropfrag 
ips_fragdropped 
TCP 
UDP [Kent[] Mogul 1987] 
IP 576 
27.5 TCP 
UDP UDP ( RIP[] TFTP 
BOOTP[] SNMP[] DNS) 576 
7 10-19 






































































































































Chinaspubecom - 231 































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































ip i a 
ne m p input.c 

360 * If first fragment to arrive, create a reassembly queue. 

361 */ 

362 if (fp == 0) { 

363 if ((t = m get (M_DONTWAIT, MT FTABLE)) == NULL) 

364 goto dropfrag; 

365 fp = mtod(t, struct ipq *); 

366 insque (fp, &ipq); 

367 fp-»ipq ttl = IPFRAGTTL; 

368 fp->ipg p = ip-»ip p: 

369 fp->ipg id = ip->ip id; 

370 fp-»ipq next = fp-»ipq prev = (struct ipasfrag *) fp; 

371 fp-»ipq src = ((struct ip *) ip)-»ip src; 

372 fp-»ipq dst = ((struct ip *) ip)-»ip dst; 

373 q - (struct ipasfrag *) fp; 

374 goto insert; 

375 ) s. 

ip input.c 
0 10-19 0 0 ip reass 000000 
1. 

359-366 fp ip_reass 

mbuf| ( ipq ) insque 

10-20 
Net/3[] 386 machdep.c insque[] remque 
CPU 
insque[] remque Net/3 
( 10-14) 
insque[] remque VAX insque[] remque 
ipasfrag (U 10-14)[] Net/3 
ip deql| ip eng insque|| remque 
0 0 U U 








insgue O00 prev] 0 DÜ node 

void insque (void *node, void* prev); 
Remque [] node] [00 D 

void remque (void ode); 


ip_eng | 00000 pre] 00000» 


void ip_enq(struct ipasfragp,* Struct ipasfrag prev); 


ip deg | 0000p 
void ip deq(struct ipasfragp); 


O 10-20 ip reass [000000 






























































232 remo n: China-pubıcom 
—— Hun! 










































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































2; 
367 RFC 1122 (ipq ttl) Net/3 
IP TTL IP TTL 
IP TTL 
TTL 
Net/3 60 (IPFRAGTTL) ip slowtimo 
ipq ttl 1 500 ms ip_slowtimo 
30 IP IP 
ip_slowtimo 
RFC 1122 60-120 
ICMP 
ICMP 64 bit( 8 
) 0 ICMP 
Net/3 Net/3 ICMP 
64 bit 
TCP[] UDP 
8 
3. 
368-375 ip_reass ipq ip. pl| ip id[| ip. src 
ip dst ipq nextl| ipq prev ipq ( 
) q insert([] 10-25) ip 
ip reass ([] 10-21) fp 
C -—"—o— -—À AA Eee ip input.c 
377 * Find a fragment which begins after this one does. 
378 */ 
379 for (q = fp-»ipq next; q !- (struct ipasfrag *) fp; q = q-»ipf next) 
380 if (q-»ip off » ip-»ip off) ` 
381 break; 
———————  —O—.UIip_input,ë 
0 10-21 OO ip reass 0000000000 
376=381 fp for ip off 




































































































































































































































































































































































IP ID 










































































































































































Net/3 IP ID 


















































































































































China-pub.eo " 233 































































































































































































































































































































































































































































































































































































































































































ip output ip id ([] 8-22) 
Net/3 ID IP 
10-22 
10-22 
(earlier) 
0o01 



























E 


[a] AAA j 
R«————— ———— 2 1000111 — 




























































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































U 1022 (] Hn, D ü L1 H D 0 D 13 0 D 0.0 0 1 0 
10-23 
382-396 ip_reass ([] 10-22 
5 ) ( 4) 
( 6) 
ip_input.c 
382 /* pmp 
383 * If there is a preceding fragment, it may provide some of 
384 * our data already. If so, drop the data from the incoming 
385 * fragment. If it provides all of our data, drop us. 
386 */ 
387 if (q->ipf prev != (struct ipasfrag *) fp) { 
388 i = q->ipf prev->ip off + q->ipf prev-»ip len - ip->ip off; 
389 if (i > O) { 
390 if (i >= ip->ip len) 
391 goto dropfrag; 
392 m adj (dtom(ip), i); 
393 ip->ip off += i; 
394 ip->ip len -= i; 
395 } 
396 } a 
ip input.c 
U 10-23 [0 ip reas []U U D UI Ú D 
10-24 
397-412 
( 10-22 2 ) 003 
10-25 
413-426 ip enq 
ipf mff ip_reass 0 
10-26 mbu 
427-440 while m_cat 



















































































































































































































































































234 rem n; Chinarpubscon 
A Mu 


395 E ip input.c 
398 * While we overlap succeeding fragments trim them or, 
399 * if they are completely covered, dequeue them. 
400 Zë 
401 while (q !=(struct ipasfrag *) fp 44 ip->ip_off+ip->ip_len > q->ip_off){ 
402 i = (ip->ip off + ip->ip len) - q->ip_off; 
403 if (i < q-»ip len) { 
404 q-»ip len -= i; 
405 q->ip off += i; 
406 m adj (dtom(q), i); 
407 break; 
408 ) 
409 q = q-»ipf next; 
410 m freem(dtom(q->ipf prev)); 
411 ip deq(q-»ipf prev); 
412 ) .. 
ip input.c 
0 10-24 [][] ip reass DU [0000 
413 insert: tp_input.c 
414 /* 
415 * Stick new fragment in its place; 
416 * check for complete reassembly. 
417 */ 
418 ip_enq (ip, q->ipf_prev); 
419 next = 0; 
420 for (q = fp->ipq_next; q != (struct ipasfrag *) fp; q = q->ipf next) ( 
421 if (q-»ip off !- next) 
422 return (0); 5 
423 next += q->ip_len; 
424 } 
425 if (q->ipf_prev->ipf_mff & 1) 
426 return (0); er 
ip input.c 
U 10-25 DD ip reass [1000 
ip input.c 
427 /* 
428 * Reassembly is complete; concatenate fragments. 
429 tf 
430 q = fp-»ipq next; 
431 m - dtom(q); 
432 t - m-»m next; 
433 m-»m next - 0; 
434 m cat(m, t); 
435 q = q-»ipf next; 
436 while (q !- (struct ipasfrag *) fp) ( 
437 t = dtom(q); 
438 q = q->ipf next; 
439 m cat(m, t); 
440 } er 
ip input.c 


O 10-26 [][] ipreass 000000 











10-27 mbuf[] ipq 
























































































































































ipqt} 








10 IP 












































































































235 
















































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































OG 1 
002 
buf hdr frag | opts 
zai 003 
mbuf nat frag | opts 
\ J m_data 
O 10-27 meat D D 000000 
mbu 
mbuf| 
m data m cat 
208 (2.6[] ) " frag" 
IP 10-18 m data “ opts” 
10-28 20 30 IP 
ipasfrag 10-29 
IP 
4. 
441-456 ip_reass|| ip ipasfrag ip 
ip len ip_src ip_dst 
ipf_mff ( 10-14 ipasfrag ipf. qmff ip 
ipf tos) 
ip reass|[| remque ipq 
m_len|| m data 
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457-464 















































St 
O0:0P00000 


0 1028 000000 


/* 
* Create header for new ip packet by 
* modifying header of first packet; 
* dequeue and discard fragment reassembly header. 
* Make header visible. 
XI 
ip = fp->ipg next; 
ip->ip_len = next; 
ip->ipf_mff &= ^1; 
((struct ip *) ip)->ip_src = fp->ipa_src; 
((struct ip *) ip)->ip_dst = fp-»ipq dst; 
remque (fp); 
(void) m_free(dtom(fp)); 
m = dtom(ip); 
m-»m len += (ip-»ip hl << 2); 
m-»m data -- (ip-»ip.hl «« 2); 
/* some debugging cruft by sklower, below, will go 


ip input.c 


away soon */ 


if (m->m flags & M PKTHDR) ( /* XXX this should be done elsewhere */ 


int plen - 0; 
for (t = m; m; m = m-»m next) 
plen += m-»m len; 
t-»m pkthdr.len - plen; 
) 
return ((struct ip *) ip); 





[] 10-29 [ O ip reass U U H H H 


























































































































for 









































pkthdr.len 








d 








































































































copied 
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10.7 ip_slowtimo|] |] 

































































































































































































































































































































































































































































































































































































































































































































































































































































7.4 Net/3 500 ms [] IP 
ip slowtimo 10-30 
ip input.c 
515 void peu 
516 ip slowtimo (void) 
517 ( ' 
518 struct ipa *fp; 
519 int S = splnet (); 
520 fp = ipq.next; 
521 if (fp == 0) { 
522 splx(s); 
523 return; 
524 } 
525 while (fp != &ipq) { 
526 --fp-»ipq ttl; 
527 fp - fp-»next; 
528 if (fp-»prev-»ipq ttl == 0) { 
529 ipstat.ips fragtimeout++; 
530 ip freef(fp-»prev); 
531 } 
532 } 
533 splx(s); 
534 ) M 
ip input.c 
O 10-30 ip slowtimo [] Ü 
515-534 ip slowtimo TTL 0 
ip freef splnet | ip slowtimo 
| 
ip freef 10-31 
470-486 ip freef fp 
ip input. 
474 void peur 
475 ip freef(fp) 
476 struct ipq *fp; 
477 ( 
478 struct ipasfrag *q, *p; 
479 for (q = fp-»ipq next; q !- (struct ipasfrag +) fp; q = p) ( 
480 p = q-»ipf next; 
481 ip_deq(q); 
482 m freem(dtom(q)); 
483 } 
484 remque (fp); 
485 (void) m free(dtom(fp)); 
486 ) me 
1p_input.c 





O 10-31 ip freef DD 























































































































7-14 IP[] ip drain 
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(U 2-13) ip_drain 10-32 
538 void ip. input.c 
539 ip_drain() 
540 ( 
541 while (ipq.next != &ipq) { 
542 ipstat.ips_fragdropped++; 
543 ip_freef (ipq.next); 
544 } 
545 ) ë 
ip_input.c 
O 10-32 ip drain [][] 
538-545 IP IP TCP 
TCP UDP IP UDP 
108 DI 
ip_output 
ip_reass ipintr 
IP 576 Net/3 
mbu 
ip_slowtimo 
U U 
10.1 ip slowtimo (U 11-1) ICMP 
10.2 
10.3 10-170] ID[] 7 ipq mbu 
10.4 [Auerbach 1994] 
ip_output 
[Auerbach 1994] TCP/IP 



















































































































































































10.5 8-5 


































































































































































































































































































10.6 ip_off 






































































































































ipaa tt 


D 110 


TLI 00 


ICMP]] Internet] 0 0 J J Ü 





ICMP[] IP 



























































IP 

































































ICMP 




































































RFC 792 [Postel 1981b] 
ICMP 























RFC 950 [Mogul 
RFC 792 [Braden 1989a] 











Postel 1985] 

















RFC 1256 [Deering 1991a] 
































ICMP[] [| 
































[] (1) 














IP 








[] ICMP 




































































ICMP 









































































































































IP 







































































IPOD ( ) 


















































8[] 




















































































































































































































TCPO UDP 





































































































11-10 | 



























































ICMP 














0000! 















































| ICMP 












































typel] code 


ICMP_ECHO 
ICMP_ECHOREPLY 





PRC_ 








ICMP_TSAMP 
ICMP_TSTAMPREPLY 





ICMP MASKREQ 
ICMP MASKREPLY 





ICMP IREQ 
ICMP IREQREPLY 





ICMP ROUTERADVERT 
ICMP ROUTESOLICIT 


ICMP REDIRECT 
ICMP REDIRECT NET 
ICMP REDIRECT HOST 
ICMP REDIRECT TOSNET 


U U 


ICMP REDIRECT TOSHOST 








000 
000 
000000 
000000 


DO OD El 
Onnodlooloolooloologo 


=| 
Lo 


= 
o 
a 





PRC_REDIRECT_HOST 
PRC_REDIRECT_HOST 
PRC_REDIRECT_HOST 
PRC 


_REDIRECT_HOST 





ICMP_UNREACH 
ICMP_UNREACH_NET 
ICMP_UNREACH_HOST 



































Oo 
ooo|a 





oo goja 

ess Ala PY A C3 r3 = 

ooo|Oooooøoona 
Co 








PRC_UNREACH_NET 
PRC_UNREACH_HOST 











U 11-1 ICMPD D 0 0 0 0 U 
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se 








typel] code 0 U PRC_ 


ICMP_UNREACH_PROTOCOL 


0000 


PRC_UNREACH_PROTOCOL 
000000 PRC_UNREACH_PORT 
P 
p 


ICMP UNREACH PORT 


ICMP UNREACH SRCFAIL RC UNREACH SRCFAIL 


ICMP UNREACH NEEDFRAG 


0 DFO D RC_MSGSIZE 


ICMP_UNREACH_NET_UNKNOWN PRC_UNREACH_NET 


ICMP_UNREACH_HOST_UNKNOWN REACH_HOST 
ICMP_UNREACH_ISOLATED REACH_HOST 


N 
N 
N 

ICMP_UNREACH_NET_PROHIB 000000 | PRC UNREACH NET 
N 
N 
N 








ICMP_UNREACH_HOST_PROHIB 000000 | PRC_U 
0000 PRC_U 


Dan PRC, U 


REACH HOST 


ICMP UNREACH TOSNET REACH NET 

















ICMP UNREACH TOSHOST REACH HOST 




















































































































































































































































































































































































































13 0000 
14 
15 [] 
UU 
ICMP_TIMXCEED Ooo 
ICMP_TIMXCEED_INTRANS 000001200000 PRC_TIMXCEED_INTRANS 
ICMP_TIMXCEED_REASS 0000000 PRC_TIMXCEED_REASS 
un DU D D 0 
ICMP PRRAMPROB IPD D D 0 H] 
0 0000000 PRC_PARAMPROB 
ICMP_PRRAMPROB_OPTABSENT 000000 PRC_PARAMPROB 
un O00000000 
ICMP SOURCEQUENCH 000000 PRC_QUENCH 
UU DU D DD U 
[| 11-1 (0) 
O 11-1] O 120000000 
*PRC DI Net/3[] 000 UU O (11.60 10 ICMPOOOO0000000 
U 00000 || U U U U 0 0 ICMPI do 
U U D 0 0 0 Ne) U UL D U U 0 D D L] U U 
D 11300000000 1200000000 
*icmp input[][] icmp_input[] O [| ICMPU [1 DB D LH HU D] 









































e UDP[] [| [| UDPO [| [] U ICMP H H HU LH Ll 



























































































































































e TCP[] UU TCP] OOO ICMPEL D D] D D Ú! | U tcp_quenchl] [| ICMP O Ú Ú 
000000 tcp_notifyl] 

e [| U errnol] U U U D 0 0 ICMP LU 

eU U DU ut ti U U U D ICMP [J U U U U 0 0 0 0 0 0 ICMP] ILLU 
U U U U U (DUU 

U Net/30  ICMPO OU IPPO D D D 0 HL BL D DO HH E] D D] D DE. D D D B. 000000 
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ICMP ICMP 
ICMP ICMP ICMP 11-4 











































































































































































































































































































Spe TL Y code ori | pr | Er 


ICMP ECHO icmp reflect 
ICMP ECHOREPLY rip input 
ICMP TSTAMP icmp reflect 
ICMP TSTAMPREPLY rip input 
ICMP MASKREQ icmp reflect 
ICMP MASKREPLY rip input 
ICMP IREQ rip input 
ICMP IREQREPLY rip input 
ICMP ROUTERADVERT rip input 
ICMP ROUTERSOLICIT rip. input 


ICMP REDIRECT 





































































ICMP REDIRECT NET pfctlinput in rtchange | in rtchange 
ICMP REDIRECT HOST pfctlinput in rtchange | in rtchange 
ICMP REDIRECT TOSNET pfctlinput in rtchange | in rtchange 
ICMP REDIRECT TOSHOST pfctlinput in rtchange | in rtchange 


O D rip_input 
ICMP_UNREACH 





































































ICMP_UNREACH_NET pr_ctlinput udp_notify tcp_notify EHOSTUNREACH 
ICMP_UNREACH_HOST pr_ctlinput udp_notify tcp_notify EHOSTUNREACH 
ICMP_UNREACH_PROTOCOL pr_ctlinput udp_notify tcp_notify ECONNREFUSED 
ICMP_UNREACH_PORT pr_ctlinput udp_notify tcp notify ECONNREFUSED 
ICMP_UNREACH_SRCFAIL pr_ctlinput udp_notify tcp notify EHOSTUNREACH 
ICMP UNREACH NEEDFRAG pr ctlinput udp. notify tcp. notify EMSGSIZE 

ICMP UNREACH NET UNKNOWN pr ctlinput udp notify tcp notify EHOSTUNREACH 
ICMP UNREACH HOST UNKNOWN | pr ctlinput udp notify tep notify EHOSTUNREACH 
ICMP UNREACH ISOLATED pr ctlinput udp notify tcp notify EHOSTUNREACH 
ICMP UNREACH NET PROHIB pr.ctlinput udp notify tcp notify EHOSTUNREACH 








EHOSTUNREACH 





ICMP UNREACH HOST PROHIB udp notify tcp notify 





pr ctlinput 

























EHOSTUNREACH 
EHOSTUNREACH 







udp notify 
udp notify 


ICMP UNREACH TOSNET 
ICMP UNREACH TOSHOST 
13 


pr ctlinput 
pr ctlinput 
rip input 


tcp. notify 
tcp notify 

























14 
15 


rip input 
rip input 
rip input 













ICMP TIMXCEED 
ICMP TIMXCEED INTRANS 
ICMP TIMXCEED REASS 


















tcp notify 
top notify 


udp notify 
udp notify 


pr ctlinput 
pr_ctlinput 
rip input 













ICMP_PARAMPROB 
0 
ICMP_PARAMPROB_OPTABSENT 


















ENOPROTOOPT 
ENOPROTOOPT 


tcp_notify 
tcp notify 


udp_notify 
udp_notify 


pr_ctlinput 
pr_ctlinput 
rip_input 


pr_ctlinput udp_notify tcp_quench [Ct 
[upim |  [ o 


[] 11-2 TEMP 000000) 
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icmp reflect TT ICMPO 000 11.120] 
in_rtchange [] E] IP D] FH [] 22-34 
pfetlinput [00000000 7.70 
pr_etlinput D 0 0 DDD 00 DD 00 0 7.40 
rip_input 000000 ICMP[ I 32.50 
tcp notify O0O00000000 [ 27-12 
tcp_quench Hood O 27-13 
udp_notify 000000 0 23-31 
0 11-3 ICMPO IJ IJ J DB D D DJ UJ 
ICMP 0 00 U Ë U U 
DO U ICMP[] D D D D D U D DOD 00 
DO U DDD IP U DDD D 
DO O00000000P|0POOOOOOO 
DO U DDD IP 00000000 
11-4 ICMPO O00 
112 ODO 
[] 11-5 l U U UD U U 0 0 00 CMP D 0 U 0 0 D 0 0 D U U 0 0 U 
U U U U 
netinet/ip icmp.h ICMP] 0 H O 
netinet/ip icmp.c ICMP] [] 
0115 000000 
1121 uüt 
OOOO0000000 11-6000 
U [] U U U U 
icmpmaskrepl | int U ICMPI] D D D D B 0 B  U 0 
icmpstat struct icmpstat ICMPO O (| (0 11-7) 
0116 )JO00000000 
11.2.2 Hm 
ul | U 11-70 U O icmpstat D 0 OL UO ODO 
icmpstat[][] O O SNMP[ UI 
icps_oldicmp U D D D D D D D ICMpD 0 D D 0 D D D 0 . 
icps oldshort D D POOOOOOOOODOOO ° 














gue 00000000 
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icmpstat[][] U [] SNMP] D O 
icps_badcode 000000000 CMD OD . 
icps_badlen 00000 CMP H H H H ICMP O Ü ° 
icps_checksum DO OD ICMPU EH E D DO 00 ICMPTI O O . 
icps tooshort 0 D ICMPD D 0 D 0 D 0 00 0 0 ° 
icps outhist[] | 0000000 -0 0 CMP D 0 D 0 0 > 
icps inhist[] OOOO0000;0010MPOOO0O0O00 ° 
icps_error icmp error 00 (0 D D D DU 
icps reflect 00000 ICMPT O O 

D XI 407 
11-8 netstat -ig 























































































































































netstat -s [| Ú icmpstat [| [] 


84124 calls to icmp_error icps_error 
icps_oldicmp 


0 errors not generated 'cuz old message was icmp 

Output histogram: icps outhist[] 
echo reply: 11770 ICMP ECHOREPLY 
destination unreachable: 84118 ICMP UNREACH 
time exceeded: 6 ICMP TIMXCEED 

6 messages with bad code fields icps badcode 

0 messages « minimum length icps_badlen 

0 bad checksums icps_checksum 

143 messages with bad length icps_tooshort 

icps inhist[] 


Input histogram: 
echo reply: 793 ICMP ECHOREPLY 
destination unreachable: 305869 ICMP UNREACH 
ICMP_SOURCEQUENCH 


source quench: 621 

routing redirect: 103 ICMP_REDIRECT 

echo: 11770 ICMP_ECHO 

time exceeded: 25296 ICMP_TIMXCEED 
11770 message responses generated icps_reflect 










































0 11-8 ICMPO 0000 





11.2.3 SNMP 












































11-9 SNMP ICMP Net/3 


SNMP[ D 


icmpInErrors icps_badcode + 
icps badlen + ICMPO DD 

icps checksum + HB B H ICMPT H g 
icps tooshort 




































































































































icmpInDestUnreachs 

icmpInTimeExcds 

icmpInParmProbs 

icmpInSrcQuenchs 

icmpInRedirects 

icmpInEchos icps inhist[1[l 0 0 





000000 ICMPE 0 0 





D 11-9. ICMPO 0 B. 0 D SNMPO O 
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icmpInEchoReps 
icmpInTimestamps 
icmpInTimestampReps 
icmpInAddrMasks 
icmpInAddrMaskReps 
icmpOutMsgs H U H ICMPH OO 
icmpOutErrors icps oldicmp + 
ic dui DO000000010Mmeg 0 D 
icmpOutDestUnreachs 
icmpOutTimeExcds 
icmpOutParmProbs 
icmpOutSrcQuenchs 
icmpOutRedirects 
icmpOutEchos icps_outhist L) H 0 0 000000 ICMP DD 
icmpOutEchoReps 
icmpOutTimestamps 
icmpOutTimestampReps 
icmpOutAddrMasks 
icmpOutAddrMaskReps 
U 11-9 (U) 
icmpInMsgs[| icps_inhist icmpInErrors icmpOutMsgs 
icps_outist icmpOutErrors 
11.3 icmp|] |] 
Net/3 11-10 icmp ICMP 
42-45 icmp type icmp code ( 11-1 10) 
icmp_cksum IP ICMP (L] IP ) 
46-79 icmp_hun( JO icmp_dun( ) icmp type[] icmp code 
ICMP ICMP[] |] icmp hun[] icmp dun 
0 
80-86 ( mbuf[] le sof£tc[] ether. arp) 
#define 
11-11 ICMP ICMP IP 
ip_icmp.h 
42 struct icmp { p-icmp 
43 u char icmp type; /* type of message, see below */ 
44 u char icmp code; /* type sub code */ 
45 u short icmp cksum; /* ones complement cksum of struct */ 
46 union { 
47 u char ih pptr; /* ICMP PARAMPROB */ 
48 Struct in addr ih gwaddr; /* ICMP REDIRECT */ 
49 struct ih idseq { 
50 n short icd id; 
51 n short icd seq; 
52 ) ih idseq; 
53 int ih void; 
54 /* ICMP UNREACH NEEDFRAG -- Path MTU Discovery (RFC1191) */ 
55 struct ih pmtu { 


011-10 imo D D 
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56 n short ipm void; 

57 n short ipm_nextmtu; 
58 ) ih pmtu; 

59 } icmp hun; 


60 #define icmp pptr icmp hun.ih pptr 

61 #define icmp gwaddr icmp hun.ih gwaddr 

62 #define icmp id icmp hun.ih idseq.icd id 
63 #define icmp seq icmp hun.ih idseq.icd seq 
64 #define icmp void icmp hun.ih void 

65 #define icmp pmvoid icmp, hun.ih, pmtu.ipm void 


66 #define icmp nextmtu icmp hun.ih pmtu.ipm nextmtu 
67 union { 

68 struct id ts ( 

69 n time its otime; 

70 n time its rtime; 

71 n time its ttime; 

72 ) id ts; 

73 struct id ip ( 

74 struct ip idi ip; ji 

75 /* options and then 64 bits of data */ 
76 } id_ip; 

77 u long id mask; 

78 char id_datall]; 

79 } icmp_dun; 


80 #define icmp_otime icmp_dun.id_ts.its_otime 
81 #define icmp_rtime icmp_dun.id_ts.its_rtime 
82 #define icmp_ttime icmp_dun.id_ts.its_ttime 
83 #define icmp_ip icmp_dun.id_ip.idi_ip 

84 #define icmp_mask icmp_dun.id_mask 

85 #define icmp_data icmp_dun.id_data 

86 }; 





ip_icmp.h 
D 14-10 Or? 


ICMP{] 0 


| sun | ML Om CS 
CTI E) E Be, EE SA 


Pg DD 
am 11-11 0 0 ICMPQ [] mu = U im ) 


11.4 ICMP [] protosw[] |] 


























































































































































































































































































































































































































inetsw[4]([] 11-13)] protosw ICMP 
11-12 icmp input ICMP 
ICMP rip output rip 32 
0 0 inetsw[4] [] O 
pr_type SOCK_RAW ICMPOI DO 00000 
pr domain &inetdomain ICMP]] Internet] 0 0 [] O 

















H 11-12 ICMP [] inetsw [J 
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TCP/IP 2 
O 0 inetsw[4] LI O 
pr_protocol IPPROTO_ICMP (1) OOO OOO ip PD D 
pr_flags PR ATOMIC|PR ADDR 000000 ICMPTI O O 
pr_input icmp_input 0 PO OD ICMPTI [J 
pr_output rip_output U ICMPO D D [] PQ 
pr_ctlinput 0 ICMP] DUDU 
pr_ctloutput rip ctloutput U D DD D DD DDD DD D 
pr_usrreq rip usrreg 000000000000 
pr init 0 ICMP DI 
pr_fasttimo 0 ICMP] D D 
pr_slowtimo 0 ICMP DI 
pr_drain 0 ICMP) DD 
pr_sysctl 0 ICMP] DI 
HU (HU) 
ip_protox[]: inetsw[]: 
l 
0 11-13 00010 ipp D O O inetsw[4] 
11.5 00000 icmp_input|] |] 
ipintr IP ip_p ICMP 
ip på 1 ip protox inetsw[4] 
ICMP| | | IP 
inetsw[4][| pr input 
icmp input 
([] 10-11) 
icmp 
input[] ICMP IcCMPO 00000000 
[] 3 icmp input 
ICMP TEMP — 
IP 0000. 
ICMP (O 11-29) 
ICMP 
11-14 U 11-14 ICMPO 000000 
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50 (11.60 11.10) icmp input[] (1) (2) ICMP 
(3) ICMP (4) ICMP (5) ICMP icmp input 
11-15 
ip icmp.c 


131 static struct sockaddr in icmpsrc - ( sizeof (struct sockaddr in), AF INET J; 
132 static struct sockaddr in icmpdst = ( sizeof (struct sockaddr in), AF INET }; 
133 static struct sockaddr in icmpgw = ( sizeof (struct sockaddr in), AF INET }; 
134 struct sockaddr in icmpmask - ( 8, 0 ); 


135 void 
136 icmp input (m, hlen) 
137 struct mbuf *m; 


138 int hlen; 

139 ( 

140 struct icmp *icp; 

141 struct ip *ip - mtod(m, struct ip *); 

142 int icmplen = ip->ip len; 

143 int i; 

144 Struct in ifaddr *ia; 

145 void (*ctlfunc) (int, struct sockaddr +, struct ip Si: 
146 int code; Ñ 
147 extern u_char ip_protox[]; 

148 /* 

149 * Locate icmp structure in mbuf, and check 
150 * that not corrupted and of at least minimum length. 
151 */ 

152 if (icmplen < ICMP_MINLEN) ( 

153 icmpstat.icps_tooshort++; 

154 goto freeit; 

155 } 

156 i = hlen + min(icmplen, ICMP.ADVLENMIN); 

157 if (m->m_len < i && (m = m_pullup(m, i)) == 0) { 
158 icmpstat.icps tooshort++; 

159 return; 

160 ) 

161 ip = mtod(m, struct ip *); 

162 m->m len -= hlen; 

163 m->m data += hlen; 

164 icp = mtod(m, struct icmp *); 

165 if (in cksum(m, icmplen)) ( 

166 icmpstat.icps checksum++; 

167 goto freeit; 

168 ) 

169 m->m len += hlen; 

170 m->m data -= hlen; 

171 if (icp->icmp type > ICMP MAXTYPE) 

172 goto raw; 

173 icmpstat.icps_inhist [icp->icmp_type] ++; 

174 code = icp->icmp code; 

175 switch (icp->icmp type) { 





O 11-15 icmp_ input OO 
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317 default: 

318 break; 
319 ) 

320 raw: 

321 rip input (m); 
322 return; 


323 freeit: 






























































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































324 m freem(m); 
3253 
TH Tr DI icmp.c 
D 11-15 (0) 
1 U 
131-134 icmp_input 
icmp_input | 4 
icmp input 44000 
icmpsrc icmp input 
sockaddr in [] Net/2 icmp input 
raw input IP 
icmpsrc Net/3 rip_input 
raw_input | icmpsrc Net/2[] 0 
2: 
135-139  icmp input ICMP (m) 
IP (hlen) 11-16 | icmp_input 
ICMP 
unu U U U 
ICMP MINLEN 8 ICMPO 0000000 
ICMP_TSLEN 20 ICMPOODDODOOD 
ICMP_MASKLEN 12 ICMPQ 000000 
ICMP ADVLENMIN 36 ICMPID (00100000000 
(IP + ICMP + BADIP = 20 + 8 + 8 = 36) 
ICMP_ADVLEN (p) 36 + optsize ICMP 000000000000 el PO LH D] optsize O 







































































































































































































































































































































































































































































































































































































































































O 11-16 ICMED 0.0 D.0 DD D D D. 0 D 
140-160 icmp_input[] ip len ICMP icmplen 
ipintr[] ip len IP | 
icps tooshort mbu ICMP IP 
m_pullup ICMP IPU U IP mbu 
3.0000 
161-170 icmp input mbu IP in cksum[][] ICMP o 
[| icps_checksum 
4. 

















































































































171-175 (icmp_type) icmp_input switch 






























































CMnaspubetOM un ene mene 249 
















































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































raw ( 11-9) icmp_input icmp_code[] switch 
icmp type 
ICMP switch icmp input[] rip input ICMP 
ICMP [] | ( ) 
ICMP rip_input icmp_input 
raw 
5 ICMP 
317-325 icmp_input[ |] rip_inputl] rip input[] 
(320 ) 
IP ICMP 
° [| ICMP ( 11-28) 
. ICMP ( ping 
traceroute) 
. ICMP 
Mme 000 
ICMP 
11-17 
ICMP 
Hunu void ip 
77 ewe] zm | 0009 Doooonmon 
I 400 l 
= id i 
20 0 200 
ip 
I ! 200 30 0 80 O 
O 11-17 ICMPJO D D (0 0 iem.) 
11-18 11-15 switch 
ip_icmp.c 
176 case ICMP_UNREACH: 
177 switch (code) { 
178 case ICMP_UNREACH_NET: 
179 case ICMP_UNREACH_HOST: 
180 case ICMP_UNREACH_PROTOCOL: 
181 case ICMP_UNREACH_PORT: 
182 case ICMP_UNREACH_SRCFAIL: 
183 code += PRC_UNREACH_NET; 
184 break; 
185 case ICMP_UNREACH_NEEDFRAG: 


O 11-18 icm input DU U 0 0 0 0 U 


250 















































China-pub.com 


ip_icmp.c 





TCP/IP 2 
186 code = PRC_MSGSIZE; . 
187 break; 
188 case ICMP_UNREACH_NET_UNKNOWN: 
189 case ICMP UNREACH NET PROHIB: 
190 case ICMP UNREACH TOSNET: 
191 code = PRC UNREACH, NET; 
192 break; 
193 case ICMP UNREACH HOST UNKNOWN: 
194 case ICMP UNREACH ISOLATED: 
195 case ICMP UNREACH HOST PROHIB: 
196 case ICMP UNREACH TOSHOST: 
197 code = PRC UNREACH HOST; 
198 break; 
199 default: 
200 goto badcode; 
201 } 
202 goto deliver; 
203 case ICMP_TIMXCEED: 
204 if (code > 1) 
205 goto badcode; 
206 code += PRC_TIMXCEED_INTRANS; 
207 goto deliver; 
208 case ICMP_PARAMPROB: 
209 if (code > 1) 
210 goto badcode; 
211 code = PRC_PARAMPROB; 
212 goto deliver; 
213 case ICMP_SOURCEQUENCH: 
214 if (code) 
215 goto badcode; 
216 code = PRC_QUENCH; 
217 deliver: 
218 /* 
219 * Problem with datagram; advise higher level routines. 
220 */ ; 
221 if (icmplen < ICMP_ADVLENMIN || icmplen < ICMP ADVLEN(icp) || 
222 icp->icmp_ip.ip_hl < (sizeof(struct ip) >> 2)) { 
223 icmpstat.icps badlen++; 
224 goto freeit; 
225 } 
226 NTOHS (icp->icmp_ip.ip_len); 
227 icmpsrc.sin_addr = icp->icmp_ip.ip_dst; 
228 if (ctlfunc = inetsw[ip_protox[icp->icmp_ip.ip_p]].pr_ctlinput) 
229 (*ctlfunc) (code, (struct sockaddr *) &icmpsrc, 
230 &icp->icmp ip); 
231 break; 
232 badcode: 
233 icmpstat.icps badcode++; 
234 break; 

O 11-18 (0) 
176-216 ICMP 


icmp_type 


























































































































imcp_input 





































































































icmp_code 




































































P RC 


























N 
> 
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11 ICMP|] Internet|] | 






























































~ 





11-190 UOU PRO l] | | LU U U U 0 ICMP[] code LU U DU U U (U 
HH code] U UU PRC 0 
217-225 icmp input [] deliver[| [| [ [| D DI [] 
icmp_input[] [| [| badcode[] 











































































































































































































u u u icps_badlen|] [] 1 
Net/3 ICMP E | | [] ICMP | 






























































































































































































































































226-231 icmp input[] pr ctlinput | uui 
ip. ell OOD uu uu O IPO (code) IP 
U D u D ( icmpsrc) OGOO0O0000I ( icmp_ip)HU 1 
pr_ctlinput( uguuil ) 23-31 
232-234 100 icps_badcode 1 switch 

















































































































































































































































































































































































































































































































0 H 0 H 


PRC_HOSTDEAD 
PRC_IFDOWN 

PRC MSGSIZE 

PRC PRRAMPROB 

PRC OUENCH 

PRC QUENCH2 

PRC REDIRECT HOST 
PRC REDIRECT NET 

PRC REDIRECT TOSHOST 
PRC REDIRECT TOSNET TOS 
PRC ROUTEDEAD 
PRC TIMXCEED INTRANS 
PRC TIMXCEED REASS 
PRC UNREACH HOST 
PRC UNREACH NET 
PRC UNREACH PORT 

PRC UNREACH PROTOCOL 
PRC UNREACH SRCFAIL 








- 
° 
Un 


UU 
000 













































































021-9 000000 


= 
= 
= 
LJ 



























































PRC | Internet 
00000 Internet] 0 U D U D U D 0 D U psc 000000000 

















































































































































































































1 DODO 


Net/3 l L U I O [] ICMP ICMP rip input 
32 ICMP 
Net/3 ICMP 0 
mbuf[] icmp input [] UDD 



























































































































































































































































































































































































































































252 





















































































































































China-pub.con 














































































































































































































































































































































































































































































































































































































TCP/IP 2 
11.7.1 ICMP ECHO[] ICMP_ECHOREPLY 
ICMP ICMP 
ICMP " ping” ping 
ICMP 1 7 ping 
ping ar ping) 
1 Packet InterNet Groper 
11-20] ICMP 
0 78 15 16 31 


icmp_type 
ICMP_ECHO 
ICMP_ECHOREPLY 


[] 11-20 ICMP H 00090 




















| | 
0 


icmp_id 


000 








icmp_datal] 


0000 


icmp_cksum 

































































































































































































































































































































































































































































































































































icmp_code O[] icmp_id[] icmp seq 
icmp_data 11-21 
ICMP icmp_input ICMP 
ip icmp.c 
235 case ICMP ECHO: 
236 icp->icmp type = ICMP ECHOREPLY; 
237 goto reflect; 
277 reflect: 
278 ip-»ip len += hlen; /* since ip input deducts this */ 
279 icmpstat.icps reflect++; 
280 icmpstat.icps_outhist [icp->icmp_type]++; 
281 icmp_reflect (m); 
282 return; "n 
, ip icmp.c 
U 11-21. ice input 0200000000 
235-237 icmp type ICMP ECHOREPLY reflect 
icmp input 
277-282 ICMP icmp input reflect 






















































































































































































ICMP 






































icps reflect(11.12 








icps reflect 











icps outhist[] 
























































) 




















































































































(00 UA `. 253 









































































































































11.72 ICMP_TSTAMP| | ICMP TSTAMPREPLY 
ICMP[] | 11-22 
0 78 15 16 31 
1cmp type icmp code icmp cksum 





ICMP_TSTAMP 0 
ICMP_TSTAMPREPLY Hu 


icmp id icmp seq 
U 0 0 oO 


icmp_otime 


2000 


icmp rti 


2000 


32000 












































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































O 11-22 ICMP[] D B D 0 D D 0 
icmp code O[] icmp id[] icmp seq ICMP 
icmp_otime ( )U icmp_rtime ( ) 
icmp_ttime( ) UTC 
IP 
11-23 
ip icmp.c 
238 case ICMP TSTAMP: 
239 if (icmplen < ICMP_TSLEN) { 
240 icmpstat.icps_badlen++; 
241 break; 
242 } 
243 icp->icmp_type = ICMP_TSTAMPREPLY; 
244 icp->icmp_rtime = iptime(); 
245 icp->icmp_ttime = icp->icmp_rtime; /* bogus, do later! */ 
246 goto reflect; WA 
ip icmp.c 
O 11-23 impinput D 0 U 00 0 00 00 U 
238-246 icmp_input[] ICMP icmp_type ICMP_TSTAMPREPLY 
icmp rtime[] icmp_ttimel] [| reflect 
icmp_rtimel] icmp_ttime IP 
icmp rtime 
icmp ttime 
ICMP ( 11.8) 
1128 ICMP MASKREO[] ICMP_MASKREPLY 
ICMP 11-24 























































































































































































































RFC 950 [Mogul[] Postel 1985] ICMP 






































































































































254 reren 02 China=pubecom 
A | 























RFC 1122 


















































































































































































































































































































































































































































Lomp type icmp. code icmp cksum 
ICMP MASKREQ 0 000 


ICMP MASKREOREPLY 


icmp_seq 


U 0 U 


icmp mask 


200000 




























































































































































































































































































































































































































































































































































































0 11-24 ICMP[] [00000000 
icmpmaskrepl Net/3 icmpmaskrepl 
Of] icmp sysctl systctl(8) (11.14(] ) 
Net/2 
Net/2 
11-25 
ip icmp.c 
247 Case ICMP MASKREQ: 
248 #define satosin(sa) ((struct sockaddr in *)(sa)) 
249 if (icmpmaskrepl -- 0) 
250 break; 
251 /* 
252 * We are not able to respond with all ones broadcast 
253 * unless we receive it over a point-to-point interface. 
254 */ 
255 if (icmplen < ICMP_MASKLEN) 
256 break; 
257 switch (ip->ip_dst.s_addr) { 
258 case INADDR_BROADCAST: 
259 case INADDR_ANY: 
260 icmpdst.sin addr = ip->ip_src; 
261 break; 
262 default: 
263 icmpdst.sin addr = ip->ip_dst; 
264 } 
265 ia = (struct in_ifaddr *) ifaof_ifpforaddr ( 
266 (struct sockaddr +) &icmpdst, m->m_pkthdr.rcvif); 
267 if (ia == 0) 
268 break; 
269 icp->icmp_type = ICMP_MASKREPLY; 
270 icp->icmp mask = ia->ia sockmask.sin addr.s addr; - 
271 if (ip->ip src.s, addr == 0) { . 
272 if (ia-»ia ifp-»if flags & IFF BROADCAST) 
273 ip-»ip src = satosin(&ia-»ia broadaddr)->sin addr; 
274 else if (ia-»ia ifp->if flags & IFF_POINTOPOINT) 
275 ip-»ip src = satosin(&ia-»ia dstaddr)-»sin addr: 
276 } 





ip icmp.c 


D 11-25 icp inet 100000000000 











Il] ICMP 























Internet 
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247-256 0 switch 
rip input UU 11-15) 
Net/3 icps badlen ICMP 
icps badlen 
1. 
257-267 0.0.0.0[] 255.255.255.255 icmpdst 
ifaof_offoraddr|| icmpdst in ofaddr 
0.0.0.0[] 255.255.255.255[] ifaof offoraddr 
IP 
default ( )l| ifaof ifpforaddr 
2. 
269-270 icmp type g | ia sockmask | icmp mask 
3. 
271-276 o(“ ” 
RFC 1122) Net/3 
L | U L 
ia broadaddr|| ia_dstaddr|| icmp input ip src 
reflect ( 11-21) 
11.7.4 ICMP IREQ[] ICMP_IREQREPLY 
ICMP 0 
IP 
RFC 1122 ICMP RARP(RFC 903 [Finlayson et al. 
1984])] BOOTP(RFC 951 [Croft[] Gilmore 1985]) RFC 1541 [Droms 1993] 
( Dynamic Host Configuration Protocol[] DHCP) 
BOOTP | | 
Net/2 ICMP Net/3 rip input 
1173 [JH ICMP ROUTERADVERT[] ICMP_ROUTERSOLICIT 
RFC 1256 [] O [| ICMP Net/3 rip input 
1[] 9.6 
118 I0000 
11-26 ICMP 
icmp input case[] ICMP_REDIRECT 8.5 






































































































































256 





China-pubecon 


TCP/IP 2 













































































































































































































































































ICMP 
































































































































0 7 
icmp_type 
ICMP_REDIRECT 


15 16 31 


8 
icmp_code icmp_cksum T 
0-3 U D D 
800 
icmp_gwaddr 
000000 roo | Jr 


icmp ip 









mo D 0000000 r000000000 sii 


D 11-26 ICMPO 0000 


















































































































































































































































































































































































































































































































































































































































11-27 icmp input 
ip_icmp.c 
283 case ICMP_REDIRECT: 
284 if (code > 3) 
285 goto badcode; 
286 if (icmplen < ICMP_ADVLENMIN || icmplen < ICMP ADVLEN(icp) || 
287 icp->icmp_ip.ip_hl < (sizeof(struct ip) >> 2)) { 
288 icmpstat.icps badlen++; 
289 break; 
290 } 
291 ja 
292 * Short circuit routing redirects to force 
293 * immediate change in the kernel’s routing 
294 * tables. The message is also handed to anyone 
295 * listening on a raw socket (e.g. the routing 
296 * daemon for use in updating its tables). 
297 */ 
298 icmpgw.sin addr = ip->ip src; 
299 icmpdst.sin addr = icp->icmp gwaddr; 
300 icmpsrc.sin_addr = icp->icmp ip.ip dst; 
301 rtredirect((struct sockaddr *) &icmpsrc, 
302 (struct sockaddr *) &icmpdst, 
303 (struct sockaddr *) 0, RTF GATEWAY | RTF HOST, 
304 (struct sockaddr *) &icmpgw, (struct rtentry **) 0); 
305 pfctlinput (PRC REDIRECT HOST, (struct sockaddr *) &icmpsrc); 
306 break; M 
ID icmp.c 
D 11-27. icm input DD D U 0 D LI (Ll 
1. 
283-290 ICMP icmp_input badcode([] 11- 
180 2320 ) IP switch 
11-16 ICMP 36(ICMP_ADVLENMIN)[] ICMP_ADVLEN(icp) 
icp IP ICMP 
291-300 icmp input ( ) 
( ) icmpgw[] icmpdst 






















































































































































































icmpsrc 























11 

















257 








ICMP[] Internet 




































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































icmpsrc 
sockaddr 
2. 
301-306 Net/3 RFC 1122 
rtredirect ( icmpsrc) 
pfcetlinput] U (730 ) 
RFC 1122 
RFC 1009 
Net/3 
ICMP IP 
18 IP] [| 
119 l 
| ICMP ICMP | 
| | ICMP | I ICMP 
rip_input 
ip icmp.c 
307 FE 
308 * No kernel processing for the following; 
309 * just fall through to send to raw listener. 
310 WA 
311 case ICMP_ECHOREPLY: 
312 case ICMP_ROUTERADVERT: 
313 case ICMP_ROUTERSOLICIT: 
314 case ICMP_TSTAMPREPLY: 
315 case ICMP IREQREPLY: 
316 case ICMP MASKREPLY: 
317 default: 
318 break; 
319 } 
320 raw: 
321 rip_input (m); 
322 return; . 
ip icmp.c 
U 11-28. ice input [I IBD B D 
307-322 ICMP| raw| switch| 
11-15) switch default ( ICMP| ) raw| 
1110 JIDD 
ICMP| 8 IP icmp error ICMP 
icmp reflect ICMP ICMP 
ICMP 11-29 ICMP 






















































































































































































258 TCP/IP 2 China-pubıcom 
AA H 





ICMPT] [] 








IPD D D 0 D U 





ICMP] [] 


(0 11-15) 


D 11-29 ICMPOO OO 




































































































































































































































































11.11 icmp_error[] [] 
icmp_errorl] IP ICMP 

icmp reflect 
16 void ip icmp.c 
47 icmp error(n, type, code, dest, destifp) 
48 struct mbuf *n; 
49 int type, code; 
50 n long dest; 
51 struct ifnet *destifp; 
52 { 
53 struct ip *oip = mtod(n, struct ip *), *nip; 
54 unsigned oiplen = oip->ip_hl << 2; 
55 struct icmp *icp; 
56 struct mbuf *m; 
57 unsigned icmplen; 
58 if (type != ICMP_REDIRECT) 
59 icmpstat.icps_error++; 
60 /* 
61 * Don't send error if not the first fragment of message. 
62 * Don't error if the old packet protocol was ICMP 
63 * error message, only known informational types. 
64 */ 
65 if (oip->ip_off & “(IP MF | IP_DF)) 
66 goto freeit; S 
67 if (oip->ip_p == IPPROTO_ICMP && type != ICMP_REDIRECT && 
68 n->m_len >= oiplen + ICMP_MINLEN && 
69 !ICMP INFOTYPE(((struct icmp *) ((caddr_t) oip + oiplen))-»icmp type))( 
70 icmpstat.icps_oldicmp++; 
71 goto freeit; 
72 } 
73 /* Don’t send error in response to a multicast or broadcast packet */ 
74 if (n->m_flags & (M_BCAST | M_MCAST)) 
75 goto freeit; 





ip icmp.c 


0 11-30 icm error DD DD D 











Cha me 259 




























































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































. ( 11-30) 
. UU 11-32) 
. (U 11-33) 
46-57 n typel] code[] ICMP 
dest[] ICMP destifp IP 
mtod n oipl] oip ip IP 
ioplen 
58-75  icps error | | ICMP Net/3 
icps error SNMP 
icmp error oip 
«[] IP MF[] IP DF ip off ( 11.10) oip 
ICMP 
° ICMP icmp_type[] ICMP 
ICMP_INFOTYPE icmp_type ICMP_INFOTYPE 
Net/3| ICMP RFC 1122 | 
° (O M_BCAST[] M_MCAST] J] ) 
ICMP 
. IP IP 
. IP ( 
E ) 
Net/3 icmp reflect (11.121 ) 
Net/2[] Deering Net/3 
Deering 
ICMP 
ICMP ICMP RFC 1122[] RFC 1127 
Net/3 
ip_output ICMP ( 11-39) 
11-311] ICMP 
11-32 
76-106 icmp_error ICMP 
*m_gethdr MH_ALIGN | 
ICMP IP! ( ) 8 | 
*icmp type[] icmp_code[] icmp_gwaddr( JO icmp_pptr( 
JO icmp_nextmtu( ) icmp_nextmtu RFC 
1191 11] 24.2 = MTU " 
































































































































































































































ICMPI] [] | 11-33 
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D 11-31 ICMPO 000000 
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= Fr ip icmp.c 
77 * First, formulate icmp message 

78 SZ 

79 m = m_gethdr (M_DONTWAIT, MT HEADER); 

80 if (m == NULL) 

81 goto freeit; 

82 icmplen = oiplen + min(8, oip->ip len); 

83 m->m len = icmplen + ICMP MINLEN; 

84 MH ALIGN (m, m-»m len); 

85 icp = mtod(m, struct icmp *); 

86 if ((u int) type > ICMP MAXTYPE) 

87 panic("icmp error"); 

88 icmpstat.icps_outhist [type] ++; 

89 icp->icmp_type = type; 

90 if (type == ICMP_REDIRECT) 

91 icp->icmp_gwaddr.s_addr = dest; 

92 else { 

93 icp->icmp_void = 0; 

94 ZS 

95 * The following assignments assume an overlay with the 

96 * zeroed icmp_void field. 

97 */ 

98 if (type == ICMP_PARAMPROB) { 

99 icp->icmp pptr = code; 
100 code = 0; 
101 ) else if (type == ICMP UNREACH && 
102 code == ICMP_UNREACH_NEEDFRAG && destifp) ( 

103 icp->icmp nextmtu = htons(destifp->if_mtu); 
104 } 
105 } 
106 icp->icmp_code = code; Ne 
ip_icmp.c 
D 11-32 iem error 0000000090 
107-125 IP ( icmplen ) ICMP| 
ip len 
udp usrreq UDP ip len 
ICMP IP 
Net/2 Net/1 
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I SE ip_icmp.c 
107 beopy ((caddr_t) oip, (caddr_t) & icp->icmp_ip, icmplen); 
108 nip = &icp->icmp_ip; 
109 nip->ip_len = htons((u short) (nip->ip_len + oiplen)); 
110 zi 
111 * Now, copy old ip header (without options) 
112 * in front of icmp message. 
113 */ 
114 if (m->m data - sizeof(struct ip) < m->m_pktdat) 
115 panic("icmp len"); 
116 m->m_data -= sizeof(struct ip); 
117 m->m_len += sizeof (struct ip); 
118 m->m_pkthdr.len = m->m_len; 
119 m->m_pkthdr.rcvif = n->m_pkthär.rcvif; 
120 nip = mtod(m, struct ip *); 
121 bcopy ((caddr_t) oip, (caddr_t) nip, sizeof(struct ip)); 
122 nip->ip_len = m->m_len; 
123 nip->ip_hl = sizeof(struct ip) >> 2; 
124 nip->ip_p = IPPROTO_ICMP; 
125 nip->ip_tos = 0; 
126 icmp reflect (m); 
127 freeit: 
128 m freem(n); 
129 3 E 
ip icmp.c 
[| 11-33 imm error DO U D D U B U LI D 
MH ALIGN[] ICMP 
IP IP ( ) ICMP 
Net/2 bcopy oiplen 
(ip len) (ip hl) (ip pI O IP 
TOS (ip tos) 
RFC 792[] RFC 1122 ICMP TOS 0 
126-129 icmp_reflect icmp_reflect 
11.12 icmp reflect[|[] 
icmp reflect[] ICMP 
icmp reflect ICMP 
11-34 
icmp reflect 
11-35 
1. 
329-345  icmp reflect ip. dst 
ip sro ip der icmp_error|| icmp reflect ip src 






























































































































































ip output 
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0 U 0 U 
icmp input O0O00000000000000000000000 000 
icmp_error I000000000000000000000000000000 mnn nn 
PIIOOOOODOOOOOGOOOO 
icmp reflect I0000000000000000000 
I000000000000000000000000000000000000 
00000 
I0O000000000 
ip output D D CME D 0 0 0 0.0 D D D 00 0 0 D 0.0 D D D D D D 0 D 0 D D 0 0.0 D D 
00) 
U 11-34 ICMPO 000000 
Z; 
346-371 icmp_reflect|| in ifaddr 





































































































































































































icmp reflect 















































































































































































































































































































































































































































































































































































































































































































































































































































in ifaddr in ifaddr ( IP ) 
ip_src]] [I ip ttl[][] 255(MAXTTL) 
RFC 1700 IP TTL 64 ICMP 
TTL 255 
TTL TTL 
( ) TTL 
329 void PAA 


330 icmp reflect (m) 
331 struct mbuf *m; 


332 L 

333 struct ip *ip = mtod(m, struct ip +); 

334 struct in ifaddr *ia; 

335 struct in_addr t; 

336 struct mbuf *opts = 0, *ip srcroute(); 

337 int optlen = (ip->ip hl << 2) - sizeof (struct ip); 
338 if (in canforward(ip-»ip src) Eë 

339 ((ntohl(ip-»ip src.s addr) & IN CLASSA NET) != 

340 (IN LOOPBACKNET «« IN CLASSA NSHIFT))) ( 

341 m freem(m); /* Bad return address */ 
342 goto done; /* Ip output() will check for broadcast */ 
343 } 

344 t = ip->ip_dst; 

345 ip->ip_dst = ip->ip_src; 

346 JE 

347 * If the incoming packet was addressed directly to us, 
348 * use dst as the src for the reply. Otherwise (broadcast 
349 * or anonymous), use the address which corresponds 

350 * to the incoming interface. 

351 WI 

352 for (ia = in_ifaddr; ia; ia = ia->ia_next) { 


DH 11-35 icmp reflect 0000000 


Ch 
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353 if (t.s addr == IA SIN(ia)-»sin addr.s, addr) 

354 break; 

355 if ((ia-»ia ifp->if flags & IFF BROADCAST) && 

356 t.s addr == satosin(&ia->ia broadaddr)-»sin addr.s addr) 

357 break; 

358 } 

359 icmpdst.sin_addr = t; 

360 if (ia == (struct in_ifaddr *) 0) 

361 ia = (struct in ifaddr +) ifaof_ifpforaddr ( 

362 (struct sockaddr *) &icmpdst, m-»m pkthdr.rcvif); 

363 /* 

364 * The following happens if the packet was not addressed to us, 

365 * and was received on an interface with no IP address. 

366 */ 

367 if (ia == (struct in ifaddr +) 0) 

368 ia = in ifaddr; 

369 t = IA SIN(ia)->sin addr; 

370 ip->ip src = t; 

371 ip->ip_ttl = MAXTTL; "m 

ip icmp.c 
0 11-35 (O) 
RFC 1122 
RFC 
122 ICMP Net/3 
icmp reflect([] 11-21) 
(0 11-36)]] ICMP 

372 if (optlen » 0) ( PENGE 

373 u char *cp; 

374 int opt, cnt; 

375 u int len; 

376 /* 

377 * Retrieve any source routing from the incoming packet; 

378 * add on any record-route or timestamp options. 

379 */ 

380 cp = (u char *) (ip + 1); 

381 if ((opts = ip sreroute()) == 0 && 

382 (opts = m gethdr(M DONTWAIT, MT HEADER))) { 

383 opts->m len = sizeof(struct in addr); 

384 mtod(opts, struct in_addr *)->s addr = 0; 

385 } 

386 if (opts) { 

387 for (ent = optlen; ent > 0; cnt -= len, cp += len) { 

388 opt = cp[IPOPT_OPTVAL]; 

389 if (opt == IPOPT EOL) 

390 break; 

391 if (opt == IPOPT_NOP) 

392 len = 1; 

393 else { 

394 len = cp[IPOPT OLEN]; 

395 if (len <= 0 || len > cnt) 

396 break; 

397 } 

398 /* 


[] 11-36 icm reflect 0000000 
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399 * Should check for overflow, but it "can’t happen" 
400 */ + 
401 if (opt == IPOPT_RR || opt == IPOPT_TS || 
402 opt == IPOPT_SECURITY) 
403 bcopy ( (caddr_t) cp, 
404 mtod(opts, caddr_t) + opts->m_len, len); 
405 opts->m_len += len; 
406 } 
407 } 
408 /* Terminate & pad, if necessary */ 
409 if (ent = opts->m_len % 4) { 
410 for (; ent < 4; cnt++) I 
411 X (mtod(opts, caddr t) + opts-»m len) = 
412 IPOPT EOL; 
413 opts-»m len++; 
414 } 
415 } 
416 } 
-ip icmp.c 
O 11-36 (O) 
3. 
372-385 4300 (0 11-37)] icmp error 
icmp_reflect IP 
icmp reflect[] ICMP 
cp ip srcroute ipintr 
ip srcoute 0 icmp reflect 
mbuf ipoption 
4. 
386-416 opts for IP ip_srcroute 
ICMP 11-37 
PE) a ip_icmp.c 
418 * Now strip out original options by copying rest of first 
419 * mbuf’s data back, and adjust the IP length. 
420 */ 
421 ip->ip len -= optlen; 
422 ip->ip hl = sizeof(struct ip) >> 2; 
423 m->m len -= optlen; 
424 if (m->m flags & M PKTHDR) 
425 m->m pkthdr.len -= optlen; 
426 optlen += sizeof (struct ip); 
427 bcopy ((caddr_t) ip + optlen, (caddr t) (ip + 1), 
428 (unsigned) (m->m len - sizeof(struct ip))); 
429 } 
430 m-»m flags &= "(M BCAST | M_MCAST); 
431 icmp send(m, opts); 
432 done: 
433 if (opts) 
434 (void) m free(opts); 
435 ] zc SE 
ip icmp.c 


U 11-37 iemp reflect 00000000 
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5. 
417-429 icmp reflect[] ICMP IP 
11-38 opts mbu ip output 
6. 
430-435 icmp send 
UU 








FE 
bcopyl] U o er ere ert 0) | nn | 



































beopyl] 0 D ya IP] DO OD 











































































































































































































































































































[] 11-38 icmp reflect 000090 


11.13 icmp send[|[] 








icmp send([] 11-39) ICMP IP ICMP 
















































































































































































440 void Ta 
441 icmp_send(m, opts) 

442 struct mbuf *m; 

443 struct mbuf *opts; 




































































































































































































































































































































































































































































444 { 
445 struct ip tip = mtod(m, struct ip *); 
446 int hlen; 
447 struct icmp *icp; 
448 hlen = ip->ip_hl << 2; 
. 449 m->m data += hlen; 
450 m->m len -= hlen; 
451 icp = mtod(m, struct icmp *); 
452 icp->icmp cksum = 0; 
453 icp->icmp_cksum = in cksum(m, ip->ip_len - hlen); 
454 m->m_data -= hlen; 
455 m->m_len += hlen; 
456 (void) ip_output (m, opts, NULL, 0, NULL); 
457 } - 
ip icmp.c 
O 11-39 jem send {J JJ 
440-457 icmp input ICMP Net/3 IP 
in cksum ICMP icmp cksum 
ip output[] ICMP icmp send 
ip output (O 4 ) IP ALLOWBROADCAST 
ip output ICMP ( 
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11.14 icmp_sysctl|] |] 





IP[] icmp sysctl 


China-pub.com 








11-40 






























































































































































sysctl 

















Sysct1[] [] 


ICMPCTL_MASKREPL 











icmpmaskrepl 















000000 CMpD D d B B D 














11-41 


























icmp sysctl 





467 int 


468 icmp sysctl (name, namelen, oldp, 


469 int 
470 u in 
471 void 


*name; 
t namelen; 
*oldp; 


472 size_t *oldlenp; 


473 void 


*newp; 


474 size_t newlen; 


475 I 


476 
477 
478 


479 
480 
481 
482 
483 
484 
485 
486 ) 


467-478 
479-486 


icmpmaskrepl[] |] 


11,18. 1] 


O 11-40 icmp_sysct1 [| U 


























oldlenp, newp, newlen) 


/* All sysctl names at this level are terminal. */ 
if (namelen != 1) 
return (ENOTDIR); 


switch (name[0]) { 
case ICMPCTL_MASKREPL: 


return (sysctl_int (oldp, 


default: 


return (ENOPROTOOPT) ; 


} 


/* NOTREACHED */ 


oldlenp, newp, newlen, 


[] 11-41 icmp_sysct1 [| U 
































ICMP sysctl 











ENOTDIR 


























ICMP 

































































































































































O 





E 


NOPROTOOPT 














ip_icmp.c 


&icmpmaskrepl)); 


ip icmp.c 











sysctl int 














ICMP 


IP 






































IP 























ICMP 
















































































ICMP 


















































































































































































































































23.9[] 27.6 

















UDP[] TCP 
























































ICMP 
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0.0.0.0 












































ICMP 














































































































11 








ICMP 





Internet! 
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11.4 


11.5 


11.6 


11.7 
11.8 


11.9 


11.10 
11.11 









































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































RFC 1122 
ICMP 
ICMP icmp_inout rip_input 
Net/3 IP O ICMP] O 0 0 0 
[] IP U U 
11-25[] ifaof ifpforaddr 
ICMP 
ICMP icmp rtime 
ICMP[ | U 
| 
icmp error[] [| ICMP 640 0 (O Solaris 2.x ) 
11-30 ip_off | 
11-39 ip output 
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[12] IP [] [j 



















































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































12.1 OUH 
8 DI IP (224.0.0.0[] 239.255.255.255) 
D (multicast group) D 
Internet 
{ } 
IGMP (U 130 ) 
(U 140 ) DVMRP(Distance Vector Multicast Routing Protocol 
) IP! 
FDDI Net/3 
ifnet (U 3-7) if_flags IFF_MULTICAST 
Net/3 
IP SLIP 
IP RFC 
1122 IP! 
RFC 1112 [Deering 1989] 
0 IP 
D 

1 IP! 

IP 

IP 

2 IP 

IP IGMP 

Net/3 2 IP 
Net/3 
IP 






































IANA (Internet Assigned Numbers 





































































































UDP[] TCP 
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Authority) IP RFC 1700 IANA 
RFC 1700 12-1 
O O O Net/3[] Ü 
224.0.0.0 00 INADDR UNSPEC GROUP 
224.0.0.1 000000000 INADDR_ALLHOSTS_GROUP 
224.0.0.2 I0O000000000 
224.0.0.3 uut INADDR MAX LOCAL GROUP 
224.0.0.4 DVMRP] UI 
224.0.0.255 0000 
224.0.1.1 NTP Bj B B D 
224.0.1.2 SGI-Dogfight 
0121 00000 IPHD D 
256 (224.0.0.0[] 224.0.0.255) IP 
IP TTL 
RFC 1075 224.0.0.0 224.0.0.1 
mrouted 224.0.0.0(TNADDR UNSPEC GROUP) 
224.0.0.255(INADDR MAX LOCAL GROUP) 
2 (U 6-17) 
224.0.0.1[] (INADDR_ALLHOSTS_GROUP) 































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































224.0.0.2 ICMP 
224.0.0.2(" d )[] 224.0.0.1(“ 7 ) 
(255.255.255.255) 
224.0.0.4 DVMRP 
256 (224.0.1.0~239.255.255.255) 
12-1 (224.0.1.1)[] SGI- 
Dogfight(224.0.1.2) 
Internet UDP 
































































































































































































































122 000 




















IP 12-2 
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IO 020 
O U [] O 

net/if_either.h O000000000000 
netinet/in.h O D Internet] 00000 
netinet/in_var.h Internet] 000000000 
netinet/ip_var.h LIP B B UO U U 
net/if ethersubr.c DU U D 000 
netinet/in.c 000090 
netinet/ip input.c 000000 
netinet/ip output.c 00000 

[12-2 DOOO000 

12.2.1 
| ([] 12-3) 




























































































D H 0000 0 H 


ether_ipmulticast_min | u_char [] OPOOOOOOOOOOOO 
ether ipmulticast max | u_char [] OPOOOOOOOOOOOO 


ip mrouter struct socket OO00000000000000000 
0123 J00000000 








































































































































































































































































































































































































































































































































































































































































































































































































1222 In 
Ht | ipstat 
ipstat] Ü O O 
ips_forward 000000000090 
ips cantforward | [00000000000 —0 00000000 
ips_noroute O000000000000000000 
0124 DO DO D D 
I U U D ifnetO [Dl (U 4-5) IP| Hi | 
12.3 UU D] D] U LI U 
IP 0 0 O IP uu 
u UU IP[] D D] C] ED] D] D D D] 0 0 UU 
= IPh nn M = = = 
0 IP 
SLIP 
u U U IU | i | U LU | u 
0 0 | 802.3 O IQ 
4-12 
U U U U D LL tlt U U UD U U U U U U 00 U U 
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IP 
IEEE 
IEEE IANA IP| 01:00:5e 
00:00:5e IANA 
12-5 DI] IP! 
Ki N På - 
01:00:5e 
IANA[ D 0 K— —— 390 DD roo — 
OO000 
012-5 PIOOOOOOODOOO 
12-5 O DJ IP [] Ú 
9 32[] IP ( 12.3) 12.14 
12-6 Net/3 
61 #define ETHER MAP IP MULTICAST(ipaddr, enaddr) \ f_ether.h 
62 /* struct in addr *ipaddr; */ N 
63 /* u char enaddr [6]; */ ÓN 
64 { \ 
65 (enaddr) [0] = 0x01; \ 
66 (enaddr) [1] = 0x00; \ 
67 (enaddr) [2] = Ox5e; ^ 
68 (enaddr) [3] = ((u char *)ipaddr)[1] & Ox7f; \ 
69 (enaddr) [4] = ((u char *)ipaddr) [2]; \ 
70 (enaddr) [5] = ((u_char *)ipaddr) [3]; \ 
71 ) 
if ether.h 
[] 12-6 ETHER MAP IP MULTICAST i 
IP| 
61-71 ETHER MAP IP MULTICAST 12-5 ipaddr D 
enaddr 6 3 
0x01[] OxOO[] Ox5e 0 DI] IP 23 
12.4 ether_multil[] [] 
Net/3 
IP 





































































































































































































































































































ether_multi (U 12-7) 










































































SE onum China-pubıcom 
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if_ether.h 
147 struct ether_multi { 
148 u_char enm_addrlo[6]; /* low or only address of range */ 
149 u char enm addrhi [6]; /* high or only address of range */ 
150 struct arpcom *enm_ac; /* back pointer to arpcom */ 
151 u int enm_refcount; /* no. claims to this addr/range */ 
152 struct ether multi *enm next; /* ptr to next ether multi */ 
153 }; . 
if_ether.h 
O 12-7 ether muti [| [| 
1. 
147-153 enm_addrlo|| enm addrhi 
enm addrlo[| enm addrhi ether multi 
arpcom ([] 3-26) ARP — arpcom 
Net/3 
enm ac arpcom enm refcount ether multi 
0 arpcom enm next ether multi 
12-8 ether multi le softc[0] 
ifnet 
le softc[0]: 
ifnet{} 
arpcom{} 
ether multi() ether multi{} ether multi() 
12-8 000 ether miti [| O [| LANCE] O 
12-8 
. 224.0.0.1( )[] 224.0.0.2( ) 
224.0.1.2(SGI-dogfight) IP 
IP 225.0.0.1 
225.0.0.2[] 226.0.1.2 
. enm ac ehter multi 
*ether multi 
12-9 ETHER LOOKUP MULTI ether multi 
2. 
166-177 addrlol| addrhi ac arpcom 
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for enm_addrlo|| enm_addrhi 



























































































































































































































































addrlo[] addrhi enm 
























































ether multi 




















































































































































































































































































































































































































































































































































































































































































































166 #define ETHER LOOKUP MULTI (addrlo, addrhi, ac, enm) V ff ether.h 
167 /* u_char addrlo[6]; */ \ 
168 /* u char addrhi[6]; */ \ 
169 /* struct arpcom *ac; */ V 
170 /* struct ether multi *enm; */ N 
171 ( \ 
172 for ((enm) = (ac)-»ac multiaddrs; \ 
173 (enm) != NULL && \ 
174 f (bcmp((enm)->enm addrlo, (addrlo), 6) != 0 II A 
175 bcmp ( (enm) ->enm_addrhi, (addrhi), 6) != 0); V 
176 (enm) = (enm)->enm next); \ š 
177 3 l 
if ether.h 
O 12-9 ETHER LOOKUP MULTI |] 
12.5 0 HU U U UT 
IP Net/3 
IP 
12-10 ioctl 
U U [] U [] [] [] [] 
SIOCADDMULT struct ifreq fy ifioctl [00000000000 
SIOCDELMULTI | struct ifreq f ifioctl [00000000000 
O 12-10 OD ioctl DJ 
ifioctl([] 12-11) ifreq (O 6-12) 
if.c 
440 case SIOCADDMULTI: 
441 case SIOCDELMULTI: 
442 if (error = suser(p->p ucred, &p->p_acflag) ) 
443 return (error); : 
444 if (ifp->if_ioctl == NULL) 
445 return (EOPNOTSUPP) ; 
446 return ((*ifp->if_ioctl) (ifp, cmd, data)); ifc 
0 12-11 ifiocti 000000 
440—446 if ioctl ifioctl 







































































































































































































































































12.6 in multi] |] 





12.4 IP 
IP IP 
IP in_ifaddr 6.5 
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Net/3 IP IP 
12-12 in_multi IP ( } 
in_var.h 
111 struct in_multi { 
112 struct in_addr inm_addr; /* IP multicast address */ 
113 struct ifnet *inm_ifp; /* back pointer to ifnet */ 
114 struct in_ifaddr *inm_ia; /* back pointer to in ifaddr */ 
115 u int inm refcount; /* no. membership claims by sockets */ 
116 u int inm timer; /* IGMP membership report timer */ 
117 struct in multi *inm next; /* ptr to next multicast address */ 
118 }; å 
in var.h 
O 12-12 in multi Un 
1. IP 
111-118 inm_addr D (UY 224.0.0.1 VT inm ifp 
ifnet inm ia in ifaddr 
( } 
in_multi 
inm_refcount 
inm_refcount O[] in multi 
ether multi 0 
inm timer 13 IGMP inm next 
in multi 
12-13 le softc[0] IP 
ifnet 
le_softc[0]: 
ifnet{} 
le softc() 
in ifaddr() 
in multi() 










224.0.0.1 













pus id 
ia multiaddrs 


in ifaddr: 

















012-13 00000 20000 
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ether_multi (U 12-34) 
le softc[l] arpcom 
IN. LOOKUP. MULTI[|([] 12-14) IP 
2. IP 
131-146 IN_LOOKUP_MULTI ifp addr 
IFP TO IA Internet in ifaddr ifp in ifaddr 
IFP TO IA for IP inm 
in multi 
: n i in_var.h 
131 #define IN_LOOKUP_MULTI (addr, ifp, inm) \ 
132 /* struct in_addr addr; */ N 
133 /* struct ifnet *ifp; */ V 
134 /* struct in multi Sim: */ \ 
135 L \ 
136 struct in ifaddr Tia; \ 
137 \ 
138 IFP TO IA((ifp), ia); \ 
139 if (ia == NULL) \ 
140 (inm) = NULL; \ 
141 else \ 
142 for ((inm) = ia->ia multiaddrs; \ 
143 (inm) != NULL && (inm)->inm_addr.s_addr != (addr).s addr; \ 
144 (inm) = inm->inm next) \ 
145 continue; V 
146 ) . 
in var.h 
O 12-14 IN LOOKUP MULTI |] 
12.7 ip moptions[|[]| 
ip moptions UDP 
ip output 
error = ip_output (m, inp->inp options, &inp->inp route, 
inp->inp socket->so options & (SO DONTROUTE|SO BROADCAST), 
inp->inp_moptions); 
22 inp Internet (PCB) UDP 
socket PCB PCB inp_moptions ip_moptions 
ip_output 
ip_moptions 12-15[] ip moptions 
: s ip var.h 
100 struct ip moptions ( 
101 struct ifnet *imo_multicast_ifp; /* ifp for outgoing multicasts */ 
102 u char imo multicast ttl; /* TTL for outgoing multicasts */ 
103 u char imo multicast loop; /* 1 => hear sends if a member */ 
104 u short imo num memberships; /* no. memberships this socket */ 
105 struct in multi *imo membership [IP MAX MEMBERSHIPS]; 
106 }; 
ip var.h 


O 12-15 ip motions JQ 


2 76 TCP/IP 2 






























































100-106 ip_output imo_multicast_ifp 





China-pubecom 




























































































imo_multicast_ifp (U 140 ) 











 multicast ttl IP TTL 1 











































































































































































































imo multicast loopl| 0 















































imo multicast loop[] I 
























































































































































































































































































































































































































































































































































imo num memberships imo membership { 
} IP IP 
imo_membership in_multi in_multi 




































































in_ifaddr 


























128 0000000 

















































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































12-16 IP ip_moptions 

IP_MULTICAST_IF struct in addr ip ctloutput | 000000000000 

IP MULTICAST TTL u char ip ctloutput | 020000000000 TTL 

IP MULTICAST LOOP u char ip ctloutput | 000000000000 

IP ADD MEMBERSHIP struct ip mred ip ctloutput (0000000 

IP DROP MEMBERSHIP | struct ip mred ip ctloutput | [JD d Hd B D 

U 1216 DD BD 0 D 
8-31 ip_ctloutput 12-17 
ip_output.c 
448 case PRCO_SETOPT: P- tp 
449 switch (optname) { 
O | 

486 case IP_MULTICAST_IF: 
487 case IP_MULTICAST_TTL: 
488 case IP_MULTICAST_LOOP: 
489 case IP_ADD_MEMBERSHIP: 
490 case IP DROP MEMBERSHIP:. 
491 error = ip setmoptions(optname, &inp->inp_moptions, m); 
492 break; 
493 freeit: 
494 default: 
495 error - EINVAL; 
496 break; 
497 } 
498 if (m) 


DH 12-17 ipctlouput 000000 
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12 








IP 
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499 (void) m_free(m); 
500 break; 
501 case PRCO_GETOPT: 
502 switch (optname) { 
539 case IP_MULTICAST_IF: 
540 case IP_MULTICAST_TTL: 
541 case IP_MULTICAST_LOOP: 
542 case IP_ADD_MEMBERSHIP: 
543 case IP_DROP_MEMBERSHIP: 
544 error = ip_getmoptions (optname, inp->inp_moptions, mp); 
545 break; 
546 default: 
547 error = ENOPROTOOPT; 
548 break; 
549 } e " 
ip output.c 
12-17 (0) 
486-491 ip setmoptions[| ip getmoptions 
ip moptions 
539-549 ip getmoptions[| ip setmoptions ioctl 
PRCO SETOPT[| PRCO GETOPT 
ENOPROTOOPT 
12.9 DO TTLO 
TTL TTL IP 
(scope) 
RFC 1122 IP TTL IP 
TTL 0 TTL 
TTL 
TTL[] O 
TTL 
12-18 TTL 
IP ip tti ([Casner 1993]) 
TTL 
32 




































































































































































































































































278 wan n? China-bubcom 
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TTL] 32( 32) TTL 32([] | U 
) — TTL 0 
TTL[] [] 128 32 (O 128- 32=96 
) 128 
31 000000 
32 0000 
63 000000 
64 0000 
95 IETF[] O 200 
127 IETF[] H 100 
128 [ D DI 
159 IETF[] O 20 0 
191 IETFO H 10 D 
223 IETFI 0200000 
255 ETFO 0100000000000 
0 12-18 1P900000 TTLO 





12.9.1 MBONE 




























































































































































































































































































































































































































































































































































































Internet U 0 IP 0 0 [| MBONE,[Casner 
1993] IP —— 
MBONE | 12-18 
TTL 310 0 32 0 0 0 IETF 1 
IP TTL[] 255 MBONE[] MBONE 
MBONE 






























































































































































1292 HUDD 






















































































































































































































































































TTL OOO TTL Doo 
(expanding-ring search[] [Boggs 1982]) TTL [] 0 
TTL[ 1 ( ) 
TTL] 2 2 | | TTL[] 

































































































































































































































































RFC 1546 [Partridge[] Mendez[] Milliken 1993] |] | 
(anycasting)|] L PO L 





















































































































































































































































































































































































































































12.10 ip setmoptions[|[] 



































































































































ip setmoptions switch 12-19 
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ip setmoptions switch 
OPERE — ip output.c 
651 ip setmoptions(optname, imop, m) 
652 int optname; 
653 struct ip moptions **imop; 
654 struct mbuf *m; 
655 ( 
656 int error - 0; 
657 u char loop; 
658 int i; 
659 struct in addr addr; 
660 struct ip mreq *mreq; 
661 struct ifnet *ifp; 
662 struct ip moptions *imo - *imop; 
663 struct route ro; 
664 struct sockaddr in *dst; 
665 if (imo == NULL) { 
666 JE 
667 * No multicast option buffer attached to the pcb; 
668 * allocate one and initialize to default values. 
669 XI 
670 imo = (struct ip moptions *) malloc(sizeof(*imo), M_IPMOPTS, 
671 M, WAITOK); 
672 if (imo == NULL) 
673 return (ENOBUFS); 
674 *imop - imo; 
675 imo->imo multicast ifp = NULL; 
676 imo->imo multicast ttl = I P DEFAULT MULTICAST TTL; 
677 imo->imo multicast loop = IP DEFAULT MULTICAST LOOP; 
678 imo->imo num memberships = 0; 
679 H 
680 Switch (optname) ( 
857 default: 
858 error - EOPNOTSUPP; 
859 break; 
860 } 
861 /* 
862 * If all options have default values, no need to keep the mbuf. 
863 *7 
864 if (imo->imo_multicast_ifp == NULL && 
865 imo->imo_multicast_ttl == IP DEFAULT MULTICAST TTL && 
866 imo->imo_multicast_loop == IP DEFAULT MULTICAST LOOP && 
867 imo->imo_num_memberships == 0) { 
868 free (*imop, M IPMOPTS); 
869 *imop = NULL; 
870 } 
871 return (error); 
872 } l 
ip output.c 
O 12-19 ip setmoptions [00 
650-664 optname imop 


































































































































































































































































































ip_motions *imop ip setmoptions 

































































280 remo a: China-pubıctom 
— 5 Hs 
























































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































ip_setmoptions ip_moptions 
*imop ip setmoptions ENOBUFS 
error|| error m 
mbuf([] 12-16 ) 
1. 
665-679 ip_moptions ip_setmoptions 
TTL l(IP_DEFAULT_MULTICAST_TTL) 
ip_output 
| U | U 
2. 
680-860 ip_setmoptions switch case 
default ( \ error EOPNOTSUPP 
3. OK 
861-872 switch ip_setmoptions ip_moptions 
ip_setmoptions 0 
12.10.1 IP MULTICAST IF 
optname|| IP MULTICAST IF ip_setmoptions|] mbuf 
12-20 
ip_output.c 
681 case IP_MULTICAST_IF: 
682 ze 
683 * Select the interface for outgoing multicast packets. 
684 */ 
685 if (m == NULL || m->m_len != sizeof (struct in_addr)) { 
686 error = EINVAL; i 
687 break; 
688 } 
689 addr = *(mtod(m, struct in addr *)); 
690 /* 
691 * INADDR ANY is used to remove a previous selection. 
692 * When no interface is selected, a default one is 
693 * chosen every time a multicast packet is sent. 
694 */ 
695 if (addr.s_addr == INADDR_ANY) ( 
696 imo->imo_multicast_ifp = NULL; 
697 break; 
698 } 
699 {* 
700 * The selected interface is identified by its local 
701 * IP address. Find the interface and confirm that 
702 * it supports multicasting. 
703 */ 


[] 12-20 ip setmoptions JOU H H n H H DH H n H 






























































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































704 INADDR TO IFP(addr, ifp); 
705 if (ifp == NULL || (ifp->if flags & IFF MULTICAST) == 0) { 
706 error = EADDRNOTAVAIL; 
707 break; 
708 } 
709 imo->imo_multicast_ifp = ifp; 
710 break; s 
ip_output.c 
[] 12-20 (0) 
1. 
681-698 mbuf mbuf in_addr 
ip_setmoptions EINVAL addr 
INADDR_ANY ip_moptions 
([] 12-40) 
2. 
699-710 addr INADDR_TO_IFP 
EADDRNOTAVAIL ifp 
ip_moptions 
12.10.2 O O TTL[] IP_MULTICAST_TTL 
optname|| IP MULTICAST TTL IP TTL 
TTL[] ip output 12-21 
711 case IP MULTICAST TTL: ip_output.c 
712 Le 
713 * Set the IP time-to-live for outgoing multicast packets. 
714 */ 
715 if (m == NULL || m-»m len !- 1) { 
716 error - EINVAL; 
717 break; 
718 H 
719 imo->imo multicast ttl = *(mtod(m, u_char *)); 
720 break; 5 
ip output.c 
[] 12-21 ip_setmoptions 0000000000 TTL 
TTL 
711—720 imo multicast ttl 
EINVAL 























12.10.3 























IP MULTICAST LOOP 














































































































































































































































































































































































































282 emo n: China-pub.com 
AT 














































































































IP MULTICAST LOOP (U 12-22)[] ip moptionsg 


















































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































ip output.c 
721 case IP MULTICAST LOOP: 
722 LE 
723 * Set the loopback flag for outgoing multicast packets. 
724 * Must be zero or one. 
725 * 
726 if (m == NULL || m->m len != 1 || 
727 (loop = *(mtod(m, u char *))) > 1) 1 
728 error = EINVAL; 
729 break; 
730 } 
731 imo->imo_multicast_loop = loop; 
732 break; ; 
ip output.c 
[] 12-22 ip setmoptions 0000000090 
721-732 m 1 O[] 1 EINVAL 
imo multicast loopl| 0 1 
12-23 imo_multicast_ttl 
imo_multicast_loop 
12-23 TTL 
( 12.6) 
(U 14[] ) 
1211 JO 00 POOO 
(U 6-17] IP 
( ) in_multi 
ether_multi 
optname[] IP_ADDMEMBERSHIP mbuf 12-24 
ip mreq 
in.h 
148 struct ip_mreq { 
149 struct in addr imr multiaddr; /* IP multicast address of group */ 
150 struct in addr imr interface; /* local IP address of interface */ 
151 }; z 
in.h 


0 12-24 ip mreq U [] 
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148-151 imr_multiaddr imr_interface IP 
ip mreq ( } 
12-25 
setsockopt getsockopt 
first join request if ioct last leave request 


SIOCADDMULTI SIOCDELMULTI 


O 12-25 p000000000 






















































































































































































































































































































































































ip setmoptions([] 12-26)[] IP ADD MEMBERSHIP 
ip_moptions IP — 
LANCE 
733 case IP ADD MEMBERSHIP: Ke hal 
734 /[* 
735 * Add a multicast group membership. 
736 * Group must be a valid IP multicast address. 
737 */ 
738 if (m == NULL || m-»m len != sizeof(struct ip mreq)) ( 
739 error - EINVAL; 
740 break; 
741 } 
742 mreq = mtodím, struct ip mreg +); 
743 if (!IN_MULTICAST (ntohl(mreq--imr multiaddr.s addr))) ( 
744 error = EINVAL; : 
745 break; 
746 } 
747 /* 
748 * If no interface address was provided, use the interface of 
749 * the route to the given multicast address. 
750 */ 
751 if (mreg->imr_interface.s_addr == INADDR_ANY) { 
752 ro.ro_rt = NULL; 
753 dst = (struct sockaddr_in *) &ro.ro_dst; 
754 dst->sin_len = sizeof (*dst); 
755 dst->sin_family = AF_INET; 


[] 12-26 ip setmoptins [D D DJ DD D D DÚ Ú 












































284 wi n2 China"pub.tom 
trett pay 












































































































































































































































































































































756 dst->sin_addr = mreq->imr multiaddr; 

757 rtalloc(&ro); 

758 if (ro.ro rt == NULL) { 

759 error = EADDRNOTAVAIL; 

760 break; 

761 } 

762 ifp = ro.ro rt->rt ifp; 

763 rtfree(ro.ro_rt); 

764 } else { 

765 INADDR_TO_IFP (mreg->imr_interface, ifp); 

766 } 

767 /* 

768 * See if we found an interface, and confirm that it 

769 * supports multicast. 

770 */ 

771 if (ifp == NULL || (ifp->if_flags & IFF_MULTICAST) == 0) { 

772 error = EADDRNOTAVAIL; i 

773 break; 

774 } 

775 ZP 

776 * See if the membership already exists or if all the 

777 * membership slots are full. 

778 */ 

779 for (i = 0; i < imo->imo num memberships; ++i) { 

780 if (imo-»imo membership[i]-»inm ifp == ifp && 

781 imo->imo membership[i]-»inm addr.s addr 

782 == mreq-»imr multiaddr.s addr) 

783 break; 

784 } 

785 if (i < imo->imo_num_memberships) { 

786 error = EADDRINUSE; 

787 break; 

788 } 

789 if (i == IP_MAX_MEMBERSHIPS) { 

790 error = ETOOMANYREFS; 

791 break; 

792 } 

793 /* 

794 * Everything looks good; add a new record to the multicast 

795 * address list for the given interface. 

796 */ 

797 if ((imo->imo membership[i] = 

798 in_addmulti (&mreq->imr_multiaddr, ifp)) == NULL) { 

799 error = ENOBUFS; 

800 break; 

801 ) 

802 ++imo->imo num memberships; 

803 break; ; 

ip output.c 
U 12-26 (0) 
1. 
733-746 ip_setmoptions mbu 
(imr_multiaddr) ip_setmoptions ENIVAL 
Mreq ip mreq 
2. 

747—774 (imr interface)[] INADDR ANY ip setmoptions 
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route 
rtalloc rtalloc 
EADDRNOTAVAIL ifp 
imr interface INADDR ANY INADDR TO IFP 
EADDRNOTAVAIL 
8.5 route 19.2 rtalloc 14 
3. 
775-792 imo_membership 
for | EADDRINUSE 
ETOOMANYREFS 
4. 
793-803 in_addmulti IP 
in_addmulti in_multi ([] 12-12) 
| | 1 
12.11.1 in_addmulti 
in_addmulti | in delmulti([] 12-27 12-36) 
in multi 
in.c 
469 struct in multi * 
470 in,addmulti(ap, ifp) 
471 struct in addr *ap; 
472 struct ifnet *ifp; 
473 ( 
474 struct in multi *inm; 
475 Struct ifreq ifr; 
476 struct in ifaddr *ia; 
477 int S = splnet (); 
478 /* 
479 * See if address already in list. 
480 *7 
481 IN LOOKUP. MULTI (*ap, ifp, inm); 
482 if (inm != NULL) ( 
483 /* 
484 * Found it; just increment the reference count. 
485 * 
486 ++inm->inm_refcount; 
487 } else { : 
in.c 
[] 12-27 in addmulti [000000 
1. 
469-487 ip_setmoptions ap D | | ifpl[l [I DL t 
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in_addmulti 


IN. LOOKUP. MULTI([] 12-14) 
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12-28 
in.c 
487 } else { 
488 FT 
489 * New address; allocate a new multicast record 
490 * and link it into the interface's multicast list. 
491 */ i 
492 inm = (struct in multi +) malloc(sizeof(*inm), 
493 M IPMADDR, M, NOWAIT); 
494 if (inm == NULL) { 
495 splx(s); 
496 return (NULL); 
497 } 
498 inm->inm_addr = *ap; 
499 inm->inm_ifp = ifp; 
500 inm->inm_refcount = 1; 
501 IFP_TO_IA(ifp, ia); 
502 if (ia == NULL) { 
503 free(inm, M_IPMADDR); 
504 splx(s); 
505 return (NULL); 
506 } 
507 inm->inm_ia = ia; 
508 inm->inm_next = ia->ia_multiaddrs; 
509 ia->ia_multiaddrs = inm; 
510 /* 
511 * Ask the network driver to update its multicast reception 
512 * filter appropriately for the new address. 
513 < 
514 ((struct sockaddr_in *) &ifr.ifr_addr)->sin_family = AF_INET; 
515 ((struct sockaddr_in *) &ifr.ifr_addr)->sin_addr = *ap; 
516 if ((ifp->if_ioctl == NULL) l| 
517 (*ifp->if_ioctl) (ifp, SIOCADDMULTI, (caddr_t) & ifr) != 0) ( 
518 ja->ia_multiaddrs = inm->inm next; 
519 free(inm, M IPMADDR) ; 
520 splx(s); 
521 return (NULL); 
522 } 
523 PE 
524 * Let IGMP know that we have joined a new IP multicast group. 
525 */ ; 
526 igmp joingroup (inm); 
527 } 
528 splx(s); 
529 return (inm); 
530 ) ; 
inc 
[] 12-28 in addmulti [000000 
2; in multi 
487-509 in addmulti in multi 
in ifaddr([] 12-13) ia multiaddrs 
3 
510-530 if ioctl in addmulti 
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ifreq ([] 4-23) SIOCADDMULTI 
in multi in addmulti 
igmp joingroup 
in addmultil] | in multi 



















































































































































































































































































































































































































































































































































































































































































































































































































































































































































































12.11.2 slioct1[] loioctl[|| SIOCADDMULTI| | SIOCDELMULTI 
SLIP | | 12-29 
SLIP 
673 case SIOCADDMULTI: if-sl.c 
674 case SIOCDELMULTI: 
675 ifr = (struct ifreq *) data; 
676 if (ifr == 0) ( ; 
677 error = EAFNOSUPPORT; /* XXX */ 
678 break; 
679 } 
680 switch (ifr->ifr_addr.sa_family) { 
681 case AF_INET: 
682 break; 
683 default: 
684 error = EAFNOSUPPORT; 
685 break; 
686 } 
687 break; . 
if alc 
[]12-29 slioctl (000000 
673-687 AF INET EAFNOSUPPORT 
12-30 
if loop.c 
152 case SIOCADDMULTT: f. loop 
153 case SIOCDELMULTI: 
154 ifr - (struct ifreq *) data; 
155 if (ifr == 0) { 
156 error - EAFNOSUPPORT; /* XXX */ 
157 break; 
158 } 
159 switch (ifr->ifr_addr.sa_family) { 
160 case AF INET: 
161 break; 
162 default: 
163 error = EAFNOSUPPORT; 
164 break; 
165 } 
166 break; I 
—— if loop.c 
D 12-30 iicci 000000 
152-166 | U 12-29[] SLIP 
AF INET EAFNOSUPPORT 
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12.11.3 leioctl SIOCADDMULTI[] SIOCDELMULTI 
4-2 LANCE leioctl[] if ioctll[] 12-31 
| SIOCADDMULTI|| SIOCDELMULTI 
if le.c 
657 case SIOCADDMULTI: 
658 case SIOCDELMULTI: 
659 /* Update our multicast list */ 
660 error = (cmd == SIOCADDMULTI) ? 
661 ether addmulti((struct ifreq *) data, &le->sc_ac) 
662 ether delmulti((struct ifreq *) data, &le->sc_ac); 
663 if (error == ENETRESET) { 
664 /* 
665 * Multicast list has changed; set the hardware 
666 * filter accordingly. 
667 */ 
668 lereset(ifp->if unit); 
669 error = 0; 
670 ) 
671 break; ` 
if_le.c 
0 12-31 1eioci JD 00000 
657-671 leioctl ether_addmulti|| ether_delmulti 
IP ENETRESET 
leioctl lereset | | 
lereset LANCE 
lereset ether multi 
LANCE 
lereset IFP ALLMULTI 
12.11.4 ether addmulti 
ether addmulti SIOCADDMULTI 
IPD (U 12-5) ether_multi 12-32 
ether_multi 
1. 
366-399 ether_addmulti addrlo[] addrhi ( ) 
AF_UNSPEC ether_addmulti 
addrlo[| addrhi AF_INET 
INADDR ANY (0.0.0.00]] ether_addmulti addrlo 
ether_ipmulticast_min addrhi ether_ipmulticast_max 
u_char ether_ipmulticast_min[6] = { 0x01, 0x00, 0x5e, 0x00, 0x00, 0x00 }; 





u_char ether ipmulticast max[6] = { 0x01, 0x00, Ox5e, Ox7f, Oxff, Oxff }; 





Chinaspubscom meno 289 



























































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































- if ethersubr.c 
366 int 
367 ether addmulti(ifr, ac) 
368 struct ifreg *ifr; 
369 struct arpcom *ac; 
370 ( 
371 struct ether multi *enm; 
372 struct sockaddr in "sin; 
373 u_char addrlo[6]; 
374 u_char addrhi[6]; 
375 int s = splimp(); 
376 switch (ifr->ifr_addr.sa_family) { 
377 case AF_UNSPEC: 
378 beopy (ifr->ifr_addr.sa_data, addrlo, 6); 
379 bcopy (addrlo, addrhi, 6); 
380 break; 
381 case AF_INET: 
382 sin = (struct sockaddr_in *) &(ifr->ifr_addr); 
383 if (sin->sin_addr.s_addr == INADDR_ANY) { 
384 /* 
385 * An IP address of INADDR ANY means listen to all 
386 * of the Ethernet multicast addresses used for IP. 
387 * (This is for the sake of IP multicast routers.) 
388 */ 
389 bcopy (ether_ipmulticast_min, addrlo, 6); 
390 bcopy (ether_ipmulticast_max, addrhi, 6); 
391 } else { i 
392 ETHER_MAP_IP_MULTICAST (&sin->sin_addr, addrlo); 
393 bcopy (addrlo, addrhi, 6); 
394 } 
395 break; 
396 default: 
397 splx(s); 
398 return (EAFNOSUPPORT); 
399 } 
if_ethersubr.c 
[] 12-32 ether addmulti [D DD D Ú 
etherbroadcastaddr(4.3[] ) 48 bit 
IP IP INADDR_ANY 
IP IANA IP 
mrouted (8) 

INADDR_ANY SIOCADDMULTI 

ETHER MAP IP MULTICAST IP 

EAFNOSUPPORT 

addrlo|| addrhi 
ether addmulti 12-33 
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2 
if_ethersubr.c 

400 /* . 

401 * Verify that we have valid Ethernet multicast addresses. 

402 */ 

403 if ((addrlo[0] & 0x01) != 1 || (addrhi[0] & 0x01) != 1) { 

404 splx (s); 

405 return (EINVAL); 

406 } 

407 /* 

408 * See if the address range is already in the list. 

409 */ 

410 ETHER LOOKUP MULTI (addrlo, addrhi, ac, enm); 

411 if (enm !- NULL) ( 

412 /* 

413 * Found it; just increment the reference count. 

414 */ 

415 ++enm->enm refcount; 

416 splx(s); 

417 return (0); 

418 } 

419 /* 

420 * New address or range; malloc a new multicast record 

421 * and link it into the interface's multicast list. 

422 */ 

423 enm = (struct ether multi *) malloc(sizeof (*enm), M IFMADDR, M_NOWAIT); 

424 if (enm == NULL) ( 

425 splx(s); 

426 return (ENOBUFS); 

427 } : 

428 bcopy (addrlo, enm->enm addrlo, 6); 

429 bcopy (addrhi, enm->enm_addrhi, 6); 

430 enm->enm_ac = ac; 

431 enm->enm_refcount = 1; 

432 enm->enm_next = ac->ac_multiaddrs; 

433 ac->ac_multiaddrs = enm; 

434 ac-»ac multicnt++; 

435 splx(s); 

436 /* 

437 * Return ENETRESET to inform the driver that the list has changed 

438 * and its reception filter should be adjusted accordingly. 

439 */ i 

440 return (ENETRESET) ; 

441 T 

if ethersubr.c 
O 12-33 ether_adduulti 000000 
2. 
400-418 ether_addmulti (O 4-12) 
ETHER LOOKUP MULTI([] 12-9) 
ether multi (enm refcount) 
ether addmulti 0 
3. ether multi 

419-441 ether_multi 






















































































































































































arpcom 

















12-8) 














ac 








multiaddrs 





















































ether_addmulti 
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ENETRESET 
12-34 LANCE ip moptions[| in multi 
ether multi 
ifnet: 







arpcom() 


ether multi() 


01:00:5e:00:00:01 
01:00:5e:00:00:01 


enm ac 


enm refcount 


in_moptions (4 


multicast ifp 


















il 
ac multiaddrs 


in ifaddr() in multi() 






membership [20] 



















01234 pg00000000 


1212 JO00 POODO 
































































































































































































































































































































































































































ip moptions IP in multi ether multi 
ip setmoptions IP DROP MEMBERSHIP 12-35 
804 case IP DROP MEMBERSHIP: ip output.c 
805 /* 
806 * Drop a multicast group membership. 
807 * Group must be a valid IP multicast address. 
808 */ 
809 if (m == NULL || m-»m len != sizeof(struct ip mreq)) { 
810 error - EINVAL; 
811 break; 
812 H 
813 mreq - mtod(m, struct ip mreq *); 
814 if (!IN MULTICAST (ntohl (mreq-»imr multiaddr.s addr))) { 
815 error - EINVAL; 
816 break; 
817 } 
818 /* 
819 * If an interface address was specified, get a pointer 
820 * to its ifnet structure. 
821 */ 
822 if (mreq->imr interface.s addr == INADDR ANY) 
823 ifp - NULL; 
824 else ( 
825 INADDR TO IFP(mreq->imr interface, ifp);. 


D 12-35 ip setmoptins 2000000000 
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826 if (ifp == NULL) { 
827 error = EADDRNOTAVAIL; 
828 break; 
829 } 
830 } 
831 /* 
832 * Find the membership in the membership array. 
833 */ 
834 for (i = 0; i < imo->imo_num_memberships; ++i) { 
835 if ((ifp == NULL |l 
836 imo->imo_membership[i]->inm_ifp == ifp) && 
837 imo->imo membership[i]->inm addr.s addr == 
838 mreq-»imr multiaddr.s addr) 
839 break; 
840 H 
841 if (i == imo->imo num memberships) { 
842 error - EADDRNOTAVAIL; 
843 break; 
844 } 
845 /* 
846 * Give up the multicast address record to which the 
847 * membership points. 
848 */ 
849 in delmulti (imo->imo_membershipli]); 
850 /* 
851 * Remove the gap in the membership array. 
852 */ 
853 for (++i; i < imo->imo_num_memberships; ++i) 
854 imo->imo_membership[i - 1] = imo->imo_membershipli]; 
855 --imo->imo num memberships; E 
856 break; 7 
ip_output.c 
U 12-35 (U) 
1. 
804-830 ip_mreq imr_multiaddr 
imr_interface 
EINVAL|| EADDRNOTAVAIL switch 
2. 
831-856 for { } in_multi 
EADDRNOTAVAIL in_delmulti in_multi 
for 





















































































































































































































































12.12.1 in_delmulti 



























































in delmulti([] 12-36) 



























































in multi 




























































































in multi 





















































































































































































































































































































































534-567 in delmulti in multi 
0 { } 
igmp_leavegroup 13.8 
for in_multi 
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: in.c 
534 int 
535 in_delmulti (inm) 
536 struct in multi *inm; 
537 ( 
538 Struct in multi **p; 
539 struct ifreq ifr; 
540 int S - gplnet(); 
541 if (--inm-»inm refcount -- 0) ( 
542 ER 
543 * No remaining claims to this record; let IGMP know that 
544 * we are leaving the multicast group. 
545 af 
546 igmp leavegroup(inm); 
547 /* 
548 * Unlink from list. 
549 */ 
550 for (p = &inm-»inm ia-»ia, multiaddrs; 
551 *p != inm; 
552 p = &(*p)-»inm next) 
553 continue; 
554 XD = (*p)-»inm next; 
555 /* . 
556 * Notify the network driver to update its multicast reception 
557 * filter. 
558 */ 
559 ((struct sockaddr_in *) &(ifr.ifr addr))->sin family = AF INET; 
560 ((struct sockaddr_in *) &(ifr.ifr_addr))->sin_addr = 
561 inm->inm_addr; 
562 (*inm->inm_ifp->if_ioctl) (inm->inm_ifp, SIOCDELMULTI, 
563 (caddr_t) & ifr); 
564 free(inm, M_IPMADDR) ; 
565 } 
566 splx(s); 
567 ) . 
in.c 
O 12-36 in delmulti QQ 
for continue 
continue 
12-9 ETHER LOOKUP MULTI continue 
in multi in delmulti 
SIOCDELMULTI 

ether multi| in multi 

LANCE SIOCDELMULTI 12-31 

SIOCADDRMULTI 












































12.12.2 ether delmulti 











































































































IP in multi 






























































































































































ether multi = = IP IP ether_ 
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multi 0 12-37[] ether_delmulti 
if_ethersubr.c 



























































































































































445 int 

446 ether delmulti(ifr, ac) 
447 struct ifreq *ifr; 

448 struct arpcom *ac; 


449 ( 

450 Struct ether, multi *enm; 

451 struct ether multi **p; 

452 struct sockaddr in *sin; 

453 u_char addrlo[6]; 

454 u char addrhi[6]; 

455 int S = splimp(); 

456 switch (ifr->ifr addr.sa family) ( 

457 case AF UNSPEC: 

458 bcopy (ifr->ifr addr.sa data, addrlo, 6); 

459 bcopy (addrlo, addrhi, 6); 

460 break; 

461 case AF_INET: 

462 sin = (struct sockaddr_in *) &(ifr->ifr_addr); 
463 if (sin->sin_addr.s_addr == INADDR_ANY) { 

464 /* i 

465 * An IP address of INADDR ANY means stop listening 
466 * to the range of Ethernet multicast addresses used 
467 * for IP. 

468 */ 

469 bcopy (ether ipmuiticast min, addrlo, 6); 
470 bcopy (ether ipmulticast max, addrhi, 6); 
471 ) else I I 

472 ETHER_MAP_IP_MULTICAST (&sin->sin_addr, addrlo); 
473 bcopy(addrlo, addrhi, 6); 

474 } 

475 break; 

476 default: 

477 splx(s); 

478 return (EAFNOSUPPORT) ; 

479 } 

480 /* 

481 * Look up the address in our list. 

482 */ . 

483 ETHER LOOKUP MULTI (addrlo, addrhi, ac, enm); 

484 if (enm == NULL) ( 

485 splx(s); 

486 return (ENXIO); 

487 ) 

488 if (--enm->enm refcount != 0) ( 

489 /* 

490 * Still some claims to this record. 

491 */ 

492 splx(s); 

493 return (0); 

494 } 

495 /* 

496 * No remaining claims to this record; unlink and free it. 
497 */ 


O 12-37 ether delmulti OD 
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498 for (p = &enm->enm ac->ac multiaddrs; 
499 xp !- enm; I 
500 p = &(*p)->enm_next) 
501 continue; 
502 *p = (*p)->enm_next; 
503 free (enm, M IFMADDR); 
504 ac->ac_multicnt--; 
505 splx(s); 
506 /* 
507 * Return ENETRESET to inform the driver that the list has changed 
508 * and its reception filter should be adjusted accordingly. 
509 */ 
510 return (ENETRESET); 
511 ) š 
if_ethersubr.c 
DH 12-37 (0) 
445-479 ether_delmulti ether_addrmulti 
addrlo|] addrhi 
1. ether multi 
480-494 ETHER_LOOKUP_MULTI ether_multi 
ENXIO 1 
ether_delmulti o 
= Inn 
2. ether multi 
495-511 for ether multi 
ENETRESET 
12.13 ip getmoptions[|[| 
ip getmoptions 12-38 
876-914 ip getmoptions optname imo 
ip moptions mp mbu m get mbuf] 
( addr[] ttl[] loop) mbu mbuf 
IP MULTICAST IF IFP TO IA 
INADDR ANY 
IP MULTICAST TTL[] imo multicast ttl E TTL 
l(IP DEFAULT MULTICAST TTL) 
IP MULTICAST LOOP imo multicast loopllll 
l(IP DEFAULT MULTICAST LOOP) 
EOPNOTSUPP 
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ip_output.c 
876 int p-outpu 

877 ip getmoptions(optname, imo, mp) 

878 int optname; 

879 struct ip moptions *imo; 

880 struct mbuf **mp; 

881 ( 

882 u char *ttl; 

883 u char *loop; 

884 struct in addr *addr; 

885 struct in ifaddr *ia; 

886 *mp - m get(M WAIT, MT SOOPTS); 

887 switch (optname) ( 

888 case IP MULTICAST IF: 

889 addr = mtod(*mp, struct in_addr +); 

890 (*mp)-»m len = sizeof (struct in_addr); 

891 if (imo == NULL || imo->imo multicast ifp == NULL) 

892 addr-»s, addr = INADDR ANY; 

893 else ( i 

894 IFP TO IA(imo->imo multicast ifp, ia); 

895 addr->s addr = (ia == NULL) ? INADDR ANY 

896 : IA SIN(ia)->sin addr.s adår; 

897 } 

898 return (0); 

899 case IP_MULTICAST_TTL: 

900 ttl = mtod(*mp, u char *); 

901 (*mp)->m len = 1; 

902 *ttl = (imo == NULL) ? IP_DEFAULT_MULTICAST_TTL 

903 imo->imo multicast ttl; 

904 return (0); 

905 case IP MULTICAST LOOP: 

906 loop = mtod(*mp, u char *); 

907 (*mp)->m len = 1; 

908 *loop = (imo == NULL) ? IP DEFAULT MULTICAST LOOP 

909 imo->imo_multicast_loop; 

910 return (0); 

911 default: 

912 return (EOPNOTSUPP); 

913 y 

914 3 P 

ip output.c 
O 12-38 ip getmoptions [00 
12.14 IO U U U 0 0 àpintz[ O 
IP 
-13 ether input IP 
IP (ipintra) mbu M_MCAST ipintr 
ipintr 12-39 
ipintr 







































































































































































































































































ip IP 
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214-245 IP 
IP (ip_mrouter) ip_id 
(ip_mforward ) ip_mforward 
(multicast tunnel) ip_mforward 
ips_cantforward 1 
14 IP 
ip_mforward ipintr 
ip_mforward 0 ip_id ipintr 
ip IGMP ours[] (0 10-11[] ipintr) 
IGMP IGMP 
246-257 12-39 
IN_LOOKUP_MULTI 
ipintr([] 10-11)[] ours 
- - - ip_input.c 

214 if (IN_MULTICAST (ntohl (ip->ip_dst.s_addr))) { 

215 struct in_multi *inm; 

216 extern struct socket *ip_mrouter; 

217 if (ip_mrouter) { 

218 "Abé 

219 * If we are acting as a multicast router, all 

220 * incoming multicast packets are passed to the 

221 * kernel-level multicast forwarding function. 

222 * The packet is returned (relatively) intact; if 

223 * ip mforward() returns a non-zero value, the packet 

224 * must be discarded, else it may be accepted below. 

225 * 

226 * (The IP ident field is put in the same byte order 

227 * as expected when ip mforward() is called from 

228 * ip output().) 

229 */ 

230 ip->ip id = htons(ip-»ip id); 

231 if (ip mforward(m, m-»m pkthdr.rcvif) != 0) ( 

232 ipstat.ips_cantforward++; 

233 m_freem (m); 

234 goto next; 

235 } 

236 ip->ip_id = ntohs (ip->ip_id); 

237 /* 

238 * The process-level routing demon needs to receive 

239 * all multicast IGMP packets, whether or not this 

240 * host belongs to their destination groups. 

241 */ 


O 12-39 ipintr [IH LL D BED U 












































298 zn n: Chinabubecom 
TET u | 
































































































































































































































































































































































































































































































































242 if (ip->ip_p == IPPROTO_IGMP) 
243 goto ours; 
244 ipstat.ips_forward++; 
245 } 
246 /* 
247 * See if we belong to the destination multicast group on the 
248 * arrival interface. 
249 */ 
250 IN LOOKUP MULTI (ip->ip dst, m-»m pkthdr.rcvif, inm); 
251 if (inm -- NULL) ( 
252 ipstat.ips_cantforward++; 
253 m freem(m); 
254 goto next; 
255 } 
256 goto ours; 
257 3 ES 
ip inpul.c 
O 12-39 (03 
12.15 0000000 ip—output0 D 
8 ip output ip. output[] mp 
ip output mp ip moptions 
ip output 12-40 12-41 ip m 
mbuf[] ifp 
- - - ip output.c 

129 if (IN MULTICAST (ntohl(ip-»ip dst.s addr))) { 
130 Struct in multi *inm; 
131 extern struct ifnet loif; 
132 m->m flags |= M_MCAST; 
133 pE 
134 * IP destination address is multicast. Make sure "Ast" 
135 * still points to the address in "ro". (It may have been 
136 * changed to point to a gateway address, above.) 
137 */ 
138 dst = (struct sockaddr in +) £ro->ro_dst; 
139 za 
140 * See if the caller provided any multicast options 
141 */ 
142 if (imo != NULL) { 
143 ip->ip_ttl = imo-»imo multicast ttl; 
144 if (imo-»imo multicast ifp != NULL) 
145 ifp = imo->imo multicast ifp; 
146 ) eise 
147 ip->ip ttl = IP DEFAULT MULTICAST TTL; 
148 /* 
149 * Confirm that the outgoing interface supports multicast. 
150 */ 
151 if ((ifp-»if flags & IFF_MULTICAST) == 0) { 
152 ipstat.ips noroute++; 
153 error = ENETUNREACH; 
154 goto bad; 
155 } 
156 /* 


O 12-40 ip output U 0 00 00 0 0 0 
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157 * If source address not specified yet, use address 
158 * of outgoing interface. 
159 */ 
160 if (ip->ip_src.s_addr == INADDR ANY) { 
161 struct in ifaddr *ia; 
162 for (ia = in ifaddr; ia; ia = ia->ia next) 
163 if (ia->ia_ifp == ifp) { 
164 ip->ip_src = IA SIN(ia)->sin addr; 
165 break; 
166 ) 
167 } 
ip_output.c 
O 12-40 (O) 
- - - - ip_output.c 
168 IN_LOOKUP_MULTI (ip->ip_dst, ifp, inm); 
169 if (inm != NULL && 
170 (imo == NULL || imo->imo_multicast_loop)) { 
171 /* 
172 * If we belong to the destination multicast group 
173 * on the outgoing interface, and the caller did not 
174 * forbid loopback, loop back a copy. 
175 */ 
176 ip_mloopback(ifp, m, dst); 
177 } else { 
178 /* 
179 * If we are acting as a multicast router, perform 
180 * multicast forwarding as if the packet had just 
181 * arrived on the interface to which we are about 
182 * to send. The multicast forwarding function 
183 * recursively calls this function, using the 
184 * IP FORWARDING flag to prevent infinite recursion. 
185 u 
186 * Multicasts that are looped back by ip mloopback(), 
187 * above, will be forwarded by the ip input() routine, 
188 * if necessary. 
189 */ 
190 extern struct socket *ip_mrouter; 
191 if (ip_mrouter && (flags & IP_FORWARDING) == 0) ( 
192 if (ip_mforward(m, ifp) != 0) ( 
193 m_freem(m); 
194 goto done; 
195 } 
196 } 
197 } 
198 /* 
199 * Multicasts with a time-to-live of zero may be looped- 
200 * back, above, but must not be transmitted on a network. 
201 * Also, multicasts addressed to the loopback interface 
202 * are not sent -- the above call to ip mloopback() will 
203 * loop back a copy if this host actually belongs to the 
204 * destination group on the loopback interface. 
205 */ å 
206 if (ip-»ip ttl == 0 || ifp == &loif) ( 
207 m_freem(m) ; 
208 goto done; 
209 } 
210 goto sendit; 
211 } : 
ip output.c 





O 12-41 ip output U 00000 000 0 U 
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TCP/IP 2 
1. 
129-155 12-40 ip_output 
mbuf[] [| M MCAST dst | ip output 
(Y 8-240 
ip_moptions ip_ttl||] ifp ip ttl 
I(IP DEFAULT MULTICAST TTL) 
ip moptions ip output 
O  ENETUNREACH[ 
2. 
156-167 for IP 
ip_src 
12-41 ip_output 
3. 
168-176 IN_LOOKUP_MULTI 
imo_multicast_loop ip_mloopback 
LU | U U LU LU 
4. 
178-197 
ip_mforward ip_mforward 0 
ip_output 
ip mforwardl| ip output ip mforward 
ip output IP FORWARDING 
| IF FORWARDING[] 
5. 
198-209 TTL[] 0 (ip_mforward ) 
TTL[] 0 ip_output TTL 
ip_mloopback 
6. 
210-211 
sendit(ip_output 8-25) if_output 
21.10 ether_output arpresolve 




































































































































































301 


12 


IP 


























arpresolve 
































ER MAP MULTICAST 


















































































































































IP 
































ETH 





ER MAP MULTICAST 



































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































ip mloopback 
ip mloopback looutput([] 5-27) ip mloopback 
looutput 12-42 
ip mloopback 
ip output.c 
935 static void p_owp 
936 ip_mloopback (ifp, m, dst) 
937 struct ifnet *ifp; 
938 struct mbuf *m; 
939 struct sockaddr in *dst; 
940 ( 
941 struct ip *ip; 
942 struct mbuf *copym; 
943 copym = m_copy (m, 0, M_COPYALL); 
944 if (copym != NULL) { 
945 {* 
946 * We don’t bother to fragment if the IP length is greater 
947 * than the interface’s MTU. Can this possibly matter? 
948 £7 
949 ip = mtod(copym, struct ip *); 
950 ip->ip len = htons((u short) ip->ip_len); 
951 ip->ip off = htons((u short) ip->ip off); 
952 ip->ip sum = 0; 
953 ip->ip sum = in cksum(copym, ip->ip hl << 2); 
954 (void) looutput (ifp, copym, (struct sockaddr *) dst, NULL); 
955 } 
956 } ; 
ip output.c 
O 12-42 ip mloopback [] [| 
929-956 
ip mloopback[| ip leni ip off looutput 
IP 
12.16 ODDO 
Net/3 
ipintr | | U IP 
IP IP 
12.17 HH 
IP IP[] D 
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in-multi[] ether multi IP 
IP 
INADDR ANY 
SIOCADDMULTI 
ip moptions | | TTL 
in, multi[] | 
IP 
TTL 
U U 
12.1 IP 255.255.255.255 IP 224.0.0.1 
12.2 IP 
IP 
12.3 12.3 32[] IP 32 bit 
9 bit 5122] IP 
12.4 IP MAX MEMBERSHIPS 20 
ip moptions (O 12-15) 
12.5 IP ( ) 
12.6 
12.7 SLIP 
12.8 IP MAX MEMBERSHIPS 
12.9 
12.10 IP 
12.11 in_delmulti SIOCDELMULTI 
ioctl 
12.12 ip getmoptions mbuf| 
12.13 


































































































































































































ipsu ttn 


O 130 


IGMP|] Internet] 0000 





























































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































13.1 q 
IGMP “ " 
IGMP IGMP IGMP RFC 1112 1 13 
IGMP 
IGMP IP (2) 
IP OT ICMP ) ICMP IGMP 
IGMP IGMP 
13-1 Net/3[] IGMP 
rip_input rip_output 
aa | 
nl 
L FP 
AA AS IGMP 
IP =} ----- 
ipintr ip_output 
U 13-1 IGMPO OOO 
IGMP 13-1 in_multi IGMP 
igmp_input in_multi igmp_fasttimo 
igmp_fasttimo igmp_sendreport 
12 in_multi ip_setmoptions 
igmp joingroup[|igmp joingroup igmp sendreport 
igmp sendreport IGMP 





































































































































































































304 TCPAPDO 02000 China-bubıtoM 
E 


U U U U U D'U ip output[] 

































































U U 13-10 000000000000 l U U UD U U U 0 U U U IGMPL [| 
132 OUOU 
0132000000 IGMP] D O 40 0 | 
U U 
netinet/igmp.h IGMP] 0 ] Ü 
netinet/igmp var.h IGMP] 0 D Ü 


netinet/in_var.h IP] GB D B 








netinet/igmp.c IOMP 0 ] O 





0132 oO00000 





18.2.1 TOR 











U U 0 D 0 0 0 0 00000 DDD 13-300 

















0 0 DUDU 0 H 
igmp all hosts group u long O00000"O0000" 00 
igmp timer are running | int ODO I1GMPIODO000000000000 
igmp stat struct igmpstat IGMP] [] (0 13-4) 





114 15000000 


















































































































































1822 [TEL T] 
IGMP{] [] O 13-4[] igmpstat|] | 

Igmpstat[][] [] L| 
igps_rcv_badqueries 000000000000 
igps_rcv_badreports D D D DDD DDD DD D 
igps_rcv_badsum OOOO00000000 
igps rev ourreports O0O00000000000 
igps rev queries OOOOO0000000000 
igps rev reports OO0O000000000000 
igps rev tooshort 0000000090 
igps rev total DU DDD DDD 
igps snd reports O0O000000000000 

O 13-4 IGMP] D 











13-5[] [| vangogh.cs.berkeley.edul] [| [| netstat -p igmp[] [] | | 


















































i U U U 0 0 D vengoghl 000000 IGMPH HE UO D U 0 UO D vangogh] 
0000000 igps_snd_reportsl|] 00 


























EE 
— 
LA 
1 
CA 





















































Cha =. 305 

































































netstat -p igmp [ [0 igmpstat | [] 


18774 messages received igps rev total 
0 messages received with too few bytes igps rcv. tooshort 

0 messages received with bad checksum igps rcv badsum 
18774 membership queries received igps rcv queries 

0 membership queries received with invalid field(s) igps rcv badqueries 
membership reports received igps. rcv, reports 
membership reports received with invalid field(s) igps. rcv badreports 
membership reports received for groups to which we belong | igps rcv ourreports 
membership reports sent igps snd reports 





























GO ooo 





U 13-5 IGMPO D ] Ü 
















































































































































































































































































13.2.3 SNMP 
IGMP SNMP MIB [McCloghrie Farinacci 1994a] IGMP 
MIB 
13.3 igmp[] | 
IGMP 8 13-6 Net/3 igmp 
43 struct igmp { igmp.h 
44 u_char igmp_type; /* version & type of IGMP message */ 
45 u_char igmp_code; /* unused, should be zero */ 
46 u_short igmp_cksum; /* IP-style checksum */ 
47 struct in_addr igmp group; /* group address being reported */ 
48 ); /* (zero for queries) */ 0. 
igmp.h 
[] 13-6 igmp|] D 
igmp_type 4 bit 4 bit 13-7 





























































































































Ox11(IGMP HOST MEMBERSHIP QUERY) 000000 
0x11 (IGMP HOST MEMBERSHIP REPQR[T[][I[ DU Ú 
0x13 DVMRPT[ O ( 140 ) 











































D 13-7 IGMPJ ODO 


la IGMP) D — 


Å qo BM Es 


l 400 


e minn — h 


013-8 xee [| 0 (00 igp) 
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IH 020 
43-44  Net/3[][] IH lU U U U U U U U U U 11 O D (IGMP_HOST_MEMBERSHIP_ 
QUERY)| LU U U U U LU U U U U HD 10 IGMPI 000 l U OI 
[] (zGMP. HOST. MEMBERSHIP REPORI)J[|[] DO 0000 3000000 
U U U U U U (U 400000000 300000 01002 
45-46 IGMP 1 igmp_codel] igmp_cksum|] IP IGMP 
18 
47-48 igmp_groupl] (| O 0 i 
13-80 0 UU IP O | IGMP JOD 
13.4 IGMP[] protosw|] [1 [J 
13-9[] IGMP[] protosw[] [| 
0 D Inetsw[5] U O 
pr_type SOCK_RAW IGMP 0000000 
pr_domain &inetdomain IGMP] Internet] 0 000 
pr_protocol IPROTO_IGMP (2) 000 IP] U ip ell 
pr_flags PR ATOMIC|PR ADDR | DH nnn 
pr input igmp input OPOOOOD 
pr output rip output O PO O O IGMPT] [] 
pr ctlinput 0 IGMP|[] OOO 
pr_ctloutput rip_ctloutput 000000000090 
Pr usrreg rip usrreg O0O000000000 
pr init igmp init N IGMPO O O 
pr fasttimo igmp fasttino OOO00000000 
pr slowtimo 0 IGMP] D [1 O 
pr_drain 0 IOMP D D O 
pr_sysctl 0 IGMP|[] D O O 
U 13-9 IGMP protosw [] DD 
IGMP protosw IP| OO! DO! 
O D IGMP[] 0 0 0 320 O000000 IGMP 
ut IGMP 0 
*«OOOO000 Ul U (13.50 )| 
. IGMP (13.60 OI 
. O O IGMPO O (13.7[] ) 
| | | IGMP[] | 
e IGMP (137000 
. (13.8[] ) 
LU | | ui 
























































18.5 0000060 igmp_joingroupl] U 


0012000 U U 
igmp joingroup 0000| 





























a 








| in multi] [| [1 [1] [1] [1] [] in addmulti[] 
U U U U in multi[]| 00000 
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igmp_joingroup[] igmp_joingroup 13-10 
























































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































igmp.c 
164 void emp 
165 igmp_joingroup (inm) 
166 struct in multi *inm; 
167 { 
168 int s = splnet(); 
169 if (inm->inm_addr.s_addr == igmp_all_hosts_group || 
170 inm->inm_ifp == &loif) 
171 inm->inm_timer = 0; 
172 else { 
173 igmp sendreport(inm); 
174 inm->inm timer = IGMP RANDOM DELAY (inm->inm addr); 
175 igmp timers are running - 1; 
176 ) 
177 splx(s); 
178 3 ] 
igmp.c 
O 13-10 igmp_joingroup UL 
164-178 inm in multi = " 
inm timer igmp joingroup " d 
igmp timers are running 
igmp fasttimo (13.6[] ) 
59273 2 
IGMP_RANDOM_DELAY (13-11[] ) 
igmp_var.h 


60 * Macro to compute a random timer value between 1 and (IGMP_MAX_REPORTING_ 
* DELAY * countdown frequency). We generate a "random" number by adding 

62 * the total number of IP packets received, our primary IP address, and the 
* multicast address being timed-out. The 4.3 random() routine really 

64 * ought to be available in the kernel! 
















































































































































































65 */ 

66 #define IGMP RANDOM DELAY (multiaddr) N 

67 /* struct in_addr multiaddr; */ \ 

68 ( (ipstat.ips total + \ 

69 ntohl (IA SIN(in ifaddr)-»sin addr.s addr) + \ 

70 ntohl((multiaddr).s addr) \ 

71 IN 

72 % (IGMP MAX HOST REPORT DELAY * PR FASTHZ) + 1 \ 

73 ) š 

igmp var.h 
0 13-11 IGMP RANDOM DELAY  [][] 
RFC 1122 O[] 10 (IGMP MAX HOST. 

REPORT DELAY) IGMP S[] (PR FASTHZ) IGMP RANDOM. 
DELAY 1-50 r IP 
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0< (rmod50)= 49 
1< (rmod50)+1= 50 
0 
13.6 igmp fasttimo[|[| 
igmp fasttino in multi 
in multi Net/3 in multi 
























































































































































in multistep ( 13-12 ) 














































































































































































































































































































in var.h 
123 struct in multistep ( n 
124 struct in ifaddr *i ia; 
125 struct in multi *i inm; 
126 }; ` 
in var.h 
O 13-12 in multistep J] J 
123-126 i ia in ifaddr i inm in multi 
IN FIRST MULTI[] IN NEXT. MULTI[]( 13-13) 
in var. 
147 /* 
148 * Macro to step through all of the in multi records, one at a time. 
149 * The current position is remembered in "step", which the caller must 
150 * provide. IN FIRST MULTI(), below, must be called to initialize "step" 
151 * and get the first record. Both macros return a NULL "inm" when there 
152 * are no remaining records. 
153 */ 


154 #define IN NEXT MULTI(step, inm) \ 


155 
156 
157 ( ÓN 
158 
159 
160 
161 
162 
163 
164 
165 
166 
167 
168 
169 ) 


/* struct in multistep step; */ \ 
/* struct in multi *inm; */ \ 


if (((inm) = (step).i inm) != NULL) \ 
(step).i inm = (inm)-»inm next; \ 
else \ 
while ((step).i ia != NULL) ( \ 
(inm) = (step) .i_ia->ia_multiaddrs; N 
(step) .i_ia = (step).i ia-»ia next; \ 
if ((inm) != NULL) { \ 
(step) .i_inm = (inm)->inm_next; \ 
break; \ 
IN 
IN 


170 #define IN_FIRST_MULTI (step, imm) \ 


171 

172 

173 L N 
174 

175 

176 

177 y 


/* struct in multistep step; */ \ 
/* struct in multi Sim: */ N 


(step) .i_ia = in ifaddr; \ 
(step) .i_inm = NULL; \ 
IN NEXT MULTI ( (step), (inm)); \ 


in var.h 

















0 13-13 IN FIRST MULTI [] IN NEXT MULTI QQ 
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154-169 in_multi i_inm IN_NEXT 
MULTI i_ia i_inm 
in_multi while 
170-177 in multistep in ifaddr in ifaddr 
i inm IN NEXT MULTI in multi||| 

13-9[] igmp fasttimo[] IGMP 5 
igmp fasttimo( 13-14) 















































































































































































































































































































































































































































































































































































































































































































































































































































igmp.c 
187 void smp 
188 igmp fasttimo() 
189 { 
190 struct in multi *inm; 
191 int 8; 
192 struct in multistep step; 
193 /* 
194 * Quick check to see if any work needs to be done, in order 
195 * to minimize the overhead of fasttimo processing. 
196 */ 
197 if (ligmp timers, are running) 
198 return; 
199 S - splnet(); 
200 igmp timers are running - 0; 
201 IN_FIRST_MULTI (step, inm); 
202 while (inm != NULL) { 
203 if (inm->inm_timer == 0) { 
204 /* do nothing */ 
205 } else if (--inm->inm_timer == 0) { 
206 igmp_sendreport (inm); 
207 } else { 
208 igmp_timers_are_running = 1; 
209 } 
210 IN_NEXT_MULTI (step, inm); 
211 } i 
212 splx(s); 
213 } . 
ISMP.C 
O 13-14 igmp fasttino {J JJ 
187-198 igmp timers are running igmp fasttimo 
199-213 igmp fasttimo U L IN FIRST MULTI step 
inm[|| igmp fasttimo while in multi IN NEXT MULTI 
. 0 
. 0 0 IGMP 
° 0 igmp_timers_are_ 
running 1 


























310 


igmp_sendreport 


igmp_sendreport (U 13-15) IGMP 


214 stat 





TCP/IP 2 

























































































































































































ic void 


215 igmp_sendreport (inm) 
216 struct in multi *inm; 


* Assume max linkhdr + sizeof(struct ip) + IGMP_MINLEN 


* is smaller than mbuf size returned by MGETHDR. 


m->m len = sizeof(struct ip) + IGMP MINLEN; 
m-»m pkthdr.len = sizeof(struct ip) + IGMP MINLEN; 


ip-»ip len = sizeof(struct ip) + IGMP_MINLEN; 


igmp->igmp_type = IGMP_HOST_MEMBERSHIP_REPORT; 
inm->inm_addr; 


in_cksum(m, IGMP_MINLEN); 


* Request loopback of the report if we are acting as a multicast 
* router, so that the process-level routing demon can hear it. 


imo->imo multicast loop = (ip_mrouter != NULL); 


[ 13-15 igẹ sentreport ID 



























































inm in_multi igmp 


























sendreport 


China-pubecom 


igmp.c 


igmp.c 
































217 { 
218 struct mbuf *m; 
219 struct igmp *igmp; 
220 struct ip *ip; 
221 struct ip_moptions *imo; 
222 struct ip_moptions simo; 
223 MGETHDR(m, M_DONTWAIT, MT_HEADER) ; 
224 if (m == NULL) 
225 return; 
226 ZS 
227 
228 
229 */ 
230 m->m_data += max_linkhdr; 
231 
232 
233 ip = mtod(m, struct ip *); 
234 ip->ip_tos = 0; 
235 
236 ip->ip_off = 0; 
237 ip->ip_p = IPPROTO_IGMP; 
238 ip-»ip src.s addr = INADDR ANY; 
239 ip-»ip dst = inm->inm addr; 
240 igmp = (struct igmp *) (ip + 1); 
241 
242 igmp->igmp code = 0; 
243 igmp->igmp group = 
244 igmp->igmp_cksum = 0; 
245 igmp->igmp_cksum = 
246 imo = &simo; 
247 bzero((caddr t) imo, sizeof(*imo)); 
248 imo->imo_multicast_ifp = inm->inm_ifp; 
249 imo->imo multicast ttl = 1; 
250 FE 
251 
252 
253 */ 
254 { 
255 extern struct socket *ip_mrouter; 
256 
257 } 
258 ip_output (m, NULL, NULL, 0, imo); 
259 ++igmpstat.igps_snd_reports; 
260 } 
214-232 
mbuf 































































































IGMP igmp_sendreport 


















































mbuf 
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uultu IGMP] [] H H U D 
233-245 IP IGMP[] |] | INADDR ANY 
ip output g INADDR_ANY 0 
LU U L u (U | | O O PO 0 )0 
246-260 O [] igmp_sentreport[]| [| [| [| ip moptions] U OO 
[| ip output in multi] [J | UD III 0000 TrL[] 00 100 
LU LU U 0 U | ul i L i O | ul ul L 
Og Og 12.14 ul 
N IGMPO D 00 U 
IGMP[] igmp input[] pr inputi (U 13-9) 
13.7 00000 igmp_input|] |] 
12.14 LU U U ipintr U U UD U U U U U U U U U U U U U U U U 0 U 
IGMP i | i | U U U | IGMP O (| O | | 
0 000000) 
OOO igmp input[] igmp_input 000090 | 13-16 
OM uit E IGMP gt 
igmp.c 
52 void Smp. 
53 igmp input (m, iphlen) 
54 struct mbuf *m; 
55 int iphlen; 
56 ( 
57 struct igmp *igmp; 
58 struct ip *ip; 
59 int igmplen; 
60 struct ifnet *ifp - m-»m pkthdr.rcvif; 
61 int minlen; 
62 struct in multi *inm; 
63 struct in ifaddr *ia; 
64 struct in multistep step; 
65 ++igmpstat.igps rcv, total; 
66 ip = mtod(m, struct ip *); 
67 igmplen = ip->ip len; 
68 /* 
69 * Validate lengths 
70 */ 
71 if (igmplen < IGMP_MINLEN) ( 
72 ++igmpstat.igps rcv tooshort; 
73 m_freem(m); 
74 return; 
75 } 
76 minlen = iphlen + IGMP_MINLEN; 
77 if ((m->m flags & M_EXT || m->m len < minlen) && 
78 (m = m pullup(m, minlen)) == 0) ( 
79 ++igmpstat.igps rcv tooshort; 
80 return; 
81 } 


O 13-16 igẹ input TT JJ 
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TCP/IP 2 
82 pe 
83 * Validate checksum 
84 */ 
85 m->m_data += iphlen; 
86 m->m_len -= iphlen; 
87 igmp = mtod(m, struct igmp *); 
88 if (in_cksum(m, igmplen)) { 
89 ++igmpstat.igps_rcv_badsum; 
90 m freem(m); 
91 return; 
92 H 
93 m-»m data -- iphlen; 
94 m-»m len «- iphlen; 
95 ip - mtod(m, struct ip *); 
96 switch (igmp->igmp type) ( 
157 } 
158 /* 
159 * Pass all valid IGMP packets up to any process(es) listening 
160 * on a raw IGMP socket. 
161 */ 
162 rip_input (m); 
163 } E 
igmp.c 
0 13-16 (0) 
l. IGMP 
52-96 ipintr ( mbuf[] >) m IP 
iphlen 
IGMP (IGMP_MIN_LEN) 
mbuf (m_pullup) IGMP 
igmp_input 
igmp_input igmp_type 13-6 
igmp_type switch igmp type([] 13-7) 
2. |] IGMP IP 
157-163 switch default ( 
rip input rip input IGMP 
IGMP 
mrouted rip input 
13.7.1 IGMP HOST MEMBERSHIP QUERY 
RFC 1075 120 IGMP 
224.0.0.1[] (“ " ) 13-17 
97-122 ( 13.1) E 
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igps_rcv_badqueries 




































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































igmp.c 
97 case IGMP_HOST_MEMBERSHIP_QUERY: 
98 ++igmpstat.igps_rcv_queries; 
99 if (ifp == &loif) 
100 break; 
101 if (ip->ip_dst.s_addr != igmp_all_hosts_group) { 
102 ++igmpstat.igps_rcv_badqueries; 
103 m freem(m); 
104 return; 
105 } 
106 /* 
107 * Start the timers in all of our membership records for 
108 * the interface on which the query arrived, except those 
109 * that are already running and those that belong to the 
110 * "all-hosts" group. 
111 */ 
112 IN FIRST MULTI (step, inm); 
113 while (inm != NULL) ( 
114 if (inm-»inm ifp == ifp EE inm->inm timer == 0 && 
115 inm->inm addr.s addr !- igmp all hosts group) { 
116 inm->inm timer = 
117  IGMP RANDOM DELAY (inm->inm_addr) ; 
118 igmp timers are, running = 1; 
119 } 
120 IN_NEXT_MULTI (step, inm); 
121 } 
122 break; . 
igmp.c 
U 13-17 IGMP[] D D IJ LJ D LU 0 
IGMP igmp input 
IGMP RANDOM DELAY 
igmp fasttimo 
13.7.2 IGMP HOST MEMBERSHIP REPORT 
IGMP 13.1 IGMP 
13-18 
123-146 
( ) 
igmp report A 0 0 
0 
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TCP/IP 2 
igmp.c 
123 case IGMP_HOST_MEMBERSHIP_REPORT: 
124 ++igmpstat.igps_rcv_reports; 
125 if (ifp == &loif) 
126 break; 
127 if (!IN MULTICAST (ntohl (igmp->igmp_group.s_addr)) || 
128 igmp->igmp_group.s_addr != ip->ip_dst.s_addr) { 
129 ++igmpstat.igps_rcv_badreports; 
130 m freem(m); 
131 return; 
132 } 
133 £t 
134 * KLUDGE: if the IP source address of the report has an 
135 * unspecified (i.e., zero) subnet number, as is allowed for 
136 * a booting host, replace it with the correct subnet number 
137 * so that a process-level multicast routing demon can 
138 * determine which subnet it arrived from. This is necessary 
139 * to compensate for the lack of any way for a process to 
140 * determine the arrival interface of an incoming packet. 
141 */ 
142 if ((ntohl(ip-»ip src.s addr) & IN CLASSA NET) == 0) { 
143 IFP TO.IA(ifp, ia); 
144 if (ia) 
145 ip->ip src.s addr = htonl(ia-»ia subnet); 
146 } 
147 /* 
148 * If we belong to the group being reported, stop 
149 * our timer for that group. 
150 */ 
151 IN_LOOKUP_MULTI (igmp->igmp_group, ifp, inm); 
152 if (inm != NULL) { 
153 inm->inm_timer = 0; 
154 ++igmpstat.igps_rcv_ourreports; 
155 } 
156 break; ` 
igmp.c 
Ú 13-18 IGMPI [] L] U D U D LU D 
13.8 000000 igmp .1eavegroupll[l 
12 in multi 0 in delmulti 
igmp leavegroup 13-19 
179 void Supe 
180 igmp leavegroup(inm) 
181 struct in multi *inm; 
182 ( 
183 /* 
184 * No action required on leaving a group. 
185 */ 
186 ) : 
igmp.c 


O 13-19 igp leavegroup N] 
































13 IGMP[] Internet 




































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































179-186 | [| IGMP[] | 
IGMP[] IGMP[] 
U 0 U 0 
= ( nn 
icmp leavegroup in delmulti([] 12-36) 
in multi 
13.9 00 
IGMP[] IGMP IP 
IGMP IGMP 
IGMP 
IGMP (U 14 
| 
U U 
13.1 IGMP 
13.2 13-15[] 226[] 229 
13.3 U 0 U 0 
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0140 Tb 0 0 LD 




































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































141 [ll 
mrouted 
0 0 0 (packet) 
( ) (datagram)[] Net/3 
IP| IP 
14-1[] mrouted BSD sd I D D 
mrouted 1.2 O O 4.3 BSD Tahoe] [] 
2.0 D D D 4.4 BSDO Net/3 
3.3 O O SunOS 4.1.3 
IP 
Net/3 20 O 14-1 mrouted H PO OOO 
3.3 
3.3 
| IP 
Net/3 JOD (LSRR[] Loose 
Source Record Route) (9.6[] ) IP 
3.3 Net/3 
12 UDP 
Internet 
14.2 JO 00 
14-2 
netinet/ip mroute.h 00000 
netinet/ ip_mroute.(c] 00000 
netinet/raw_ip.c 000000 
0142 [000000 
14.21 





























14-3 
































































































































14p IP 31 7 


















































































































































































































































































































































































































































U U 0000 U U 
cached_mrt struct mrt D DD DD" DD DD "DDD D 
cached origin u long “0000” 0000000090 
cached originmask | u long D000” 000000000090 
mrtstat struct mrtstat 000000 
mrttable struct mrt *[] 00000000000000 
numvifs vifi t OOOOOO000 
viftable struct vif[] 0000000090 

0143 0000000090 
14.2.2 
0 14-4[] mrtstat 14-50 0 
netstat -gs 

mrt stat) [| D U SNMP[] OO 

mrts_mrt_lookups pg400000 

mrts_mrt_misses 000000000000 

mrts_grp_lookups 000000 

mrts_grp_misses 0000000000 

mrts no route 0000000000 

mrts bad tunnel 000000000000 

mrts_cant_tunnel O0OOOOOOOOOOOOO 
0144 J0000000 











netstat -gs ] [] mrtstat [] [| 


multicast routing: 


329569328 
9377023 
242754062 


15931 
6 


multicast route lookups 
multicast route cache misses 
group address lookups 


7788 group address cache misses 


5648 datagrams with no route for origin 


mrts_mrt_lookups 
mrts_mrt_misses 


mrts grp lookups 
mrts, grp misses 
mrts, no route 


0 datagrams with malformed tunnel options mrts bad tunnel 
0 datagrams with no room for tunnel options | mrts, cant, tunnel 





0145 PODALO OD 


Bunun 








[] 98% 




































































































































































34% 14-34 




































































14-21 










































































14.2.3 SNMP| 









































SNMP MIB 























Farinacci 1994b] 














[McCloghrie[] Farinacci 1994a] [McCloghrie[] 













































































MIB 











143 JI0000(0) 

















12.15 







































































































































































ip moptions 
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ip output 


TCP/IP 2 





































































































ip output 







































































| ip output 
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ipintr | 














































































































































































































































































































































































































































































































































































































































































































































































































































U U 0o00 
0146 0000000000 
14-6 
ip_mloopback 
ip_mforward 14-6 
ip_output 
ip mforward|| ip mforward 
ip output i 
14-7 i 
ip mforward ip output S 












































| | IP FORWARDING 











































































































































































































































































































































































































































































































































































































































































































































































































: 4 
ip output utl 00 000 
ip_mforward 
14-7 
12-42 ip mloopback[] 14.8 d 00000000000 
ip_mforward 
14.4 mrouted| ||] [] 
mrouted mrouted IGMP 
mrouted 
mrouted = mrouted 
TRPB(Truncated Reverse Path Broadcast) 
[Deering[] Cheriton 1990] | [ U | 
DVMRP 





















































































































































14 
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IP 









































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































RFC 1075 [Waitzman[] Partidge [| Deering1988] [| DVMRP mrouted 
| DVMRP RFC 
mroutedl[] Bl] 
mrouted O HEB IGMP (0 320 )[ E 
14-8 
optname optval] Ü O 0 [] U 
DVMRP INIT ip_mrouter_init mrouted[] [] 
DVMRP_DONE ip_mrouter_done mrouted 9 0 
DVMRP_ADD_VIF struct vifctl add_vif 00000 
DVMRP_DEL_VIF vifi_t del_vif 000000 
DVMRP_ADD_LGRP struct lgrplctl add lgrp 000000000000 
DVMRP DEL LGRP struct lgrplct]l del_lgrp 000000000000 
DVMRP_ADD_MRT struct mrtctl add_mrt 000000 
DVMRP DEL MRT struct in addr| del mrt üggauu 
0148 1 IU D 1 T TD D 
14-8 setsockopt[] J] rip ctloutput(32.8[] )| 14-9 
DVMRP xxx rip. ctloutputl[] | 
raw ip.c 
173 case DVMRP INIT: 
174 case DVMRP DONE: 
175 case DVMRP ADD VIF: 
176 case DVMRP DEL VIF: 
177 case DVMRP ADD LGRP: 
178 case DVMRP. DEL LGRP: 
179 case DVMRP ADD, MRT: 
180 case DVMRP DEL MRT: 
181 if (op == PRCO_SETOPT) ( 
182 error - ip mrouter cmd(optname, so, *m); 
183 if (*m) 
184 (void) m free(*m); 
185 ) else 
186 error - EINVAL; 
187 return (error); : 
raw ip.c 
[] 14-9 rip ctloutput [0 0 0 De xxx [] Ú LI Ú 
173-187 [| setsockopt[| [| op PRCO_SETOPT 
ip_mrouter_cmd getsockopt [] op PRCO_GETOPT 
EINVAL 
14-10 ip_mrouter_cmd 
- ip_mroute.c 
84 int 
85 ip_mrouter_cmd(cmd, so, m) 
86 int cmd; 
87 struct socket *so; 
88 struct mbuf *m; 
89 ( 
90 int error = 0; 


O 14-10 ip mrouter cmd [00 


91 
92 
93 
94 


95 
96 
97 


98 
99 
100 


101 
102 
103 
104 
105 
106 


107 
108 
109 
110 
111 
112 
113 
114 
115 
116 
117 
118 


119 
120 
121 
122 
123 
124 


125 
126 
127 
128 
129 
130 


131 
132 
133 
134 
135 
136 


137 
138 
139 
140 
141 
142 T 
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EE —1Áiij 


if (cmd != DVMRP_INIT && so != ip_mrouter) 
error = EACCES; 

else 
switch (cmd) { 


case DVMRP_INIT: 
error = ip_mrouter_init (so); 
break; 


case DVMRP_DONE: 
error = ip mrouter done(); 
break; 


case DVMRP ADD VIF: 
if (m == NULL || m->m len < sizeof (struct vifctl)) 
error = EINVAL; 
else 
error = add vif (mt od (m, struct vifctl *)); 
break; 


case DVMRP DEL VIF: 
if (m == NULL || m->m len < sizeof (short)) 
error = EINVAL; 


else 
error = del vif(mtod(m, vifi t *)); 
break; 
case DVMRP ADD LGRP: 
if (m == NULL || m-»m len < sizeof (struct lgrplctl)) 
error = EINVAL; 
else 
error = add lgrp(mtod(m, struct lgrplctl *)); 
break; 


Case DVMRP DEL LGRP: 
if (m -- NULL || m-»m len « sizeof(struct lgrplctl)) 
error = EINVAL; 
else 
error = del lgrp(mtod(m, struct lgrplctl *)); 
break; 


case DVMRP ADD MRT: 
if (m -- NULL || m-»m len « sizeof(struct mrtctl)) 
error - EINVAL; 
else 
error - add mrt(mtod(m, struct mrtctl *)); 
break; 


case DVMRP DEL, MRT: 
if (m == NULL || m-»m len « sizeof(struct in_addr)) 
error - EINVAL; 


else 
error = del mrt(mtod(m, struct in_addr *)); 
break; 
default: 
error = EOPNOTSUPP; . 
break; 


} 
return (error); 


— ——— np mroute.c 


U 14-10 (0) 





Chinaspubecom m moo 321 
































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































(command) 
84-92 mrouted DVMRP_INIT 
DVMRP_INIT EACCES 
94-142 switch | [] case 0 | | L | 
U U EOPNOTSUPP UDE error 
mrouted DVMRP INIT 14-11 ip mrouter init 
—— ip_mroute.c 
146 static int 
147 ip_mrouter_init (so) 
148 struct socket *so; 
149 { 
150 if (so->so type != SOCK_RAW || 
151 so->so_proto->pr_protocol != IPPROTO_IGMP) 
152 return (EOPNOTSUPP); 
153 if (ip_mrouter != NULL) 
154 return (EADDRINUSE); 
155 ip_mrouter = so; 
156 return (0); 
157 ) š 
ip mroute.c 
O 14-11 ip mrouter init [| [| [| DVMRP INIT [|] [| 
146-157 O IGMPD DI O00 DVMRP_INIT n 
EOPNOTSUPP|| EADDRINUSE ip_mrouter 
mrouted 
u O O DVMRP xxx] 
14.5 0000 
Net/3 
-—— 
OOOOLSRRO B D 'PD D D 0 
src-HS src=HS src=HS 
dst=G dst=T, dst=G 
YU DD: O O LSRRO PO O O D LSRRO 
U D D 0 LSRR[] (TS,G) (000 


0 14-12 0000 









































SUE amn Chinasbub.com 
— A DD 






































































































































































































































































































































































































































































































































































































































































































































































































































































































































14-12 
14-12 A HS G G B 
A A ( ) 
A IP T| B 
IP T, LSRR 
IP 14-130 H IP LSRR 
00 PQ D 00000 0 0 






























D B Ag 
















































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































T, HS T,*G DU du 
T HS T, OOO 0000 BO ip_dooptions] D 
T, HS 0000 BO ip_mforward] O 
O 14-13 ESRR 000090 
14-13 HS A A 
A[] IP LSRR 
A LSRR 
T,—— LSRR 
B 
B ip. dooptions 9 
ip dooptions[| ipintr LSRR 
(T,) B ip. dooptions ( G) 
IP Gl] ip rtaddr 
ip rtaddr IP ( G) 
ip mforward ip dooptions 
14-13 ipintr ip mforward LSRR 
ip mforward 
B HG 
LSRR 1993[] 3 mrouted 
IP IP IP 4 
IP RFC 1700 ——" IP IP" 
mrouted LSRR 
14.5.1 0 | 




































































(virtual interface) 











































































































































































































14-14) 
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vif 












































































































































Chinaspubecom xu EE 























































































































































































































































































































































































































































































































































































































































































































































































































viftable vifi_t 
i ip mroute.h 
105 struct vif { 
106 u Char v flags; /* VIFF flags */ 
107 u Char v threshold; /* min ttl required to forward on vif */ 
108 struct in_addr v. lcl addr; /* local interface address */ 
109 struct in_addr v_rmt_addr; /* remote address (tunnels only) */ 
110 struct ifnet *v ifp; /* pointer to interface */ 
111 struct in_addr *v_lcl_grps; /* list of local grps (phyints only) */ 
112 int v_lcl_grps_max; /* malloc’ed number of v_lcl_grps */ 
113 int v. lcl grps n; /* used number of v lcl grps */ 
114 u long v cached group; /* last grp looked-up (phyints only) */ 
115 int v cached, result; /* last look-up result (phyints only) */ 
116 ); . 
ip mroute.h 
O 14-14 vif H 
105-110 v flags VIFF TUNNEL 
v threshold 
12.9 v lcl addr IP 
v rmt addr IP IP v lcl addr v rmt addr 
v ifp ifnet 
v ifp 





























viftable: 


viftable[0]4 Us 


v. lcl grps max 


viftable[1] 


viftable[2] 


viftable[3] 


U 
viftable[31] 





O 14-15 viftable DI 


324 





China-pubscom 





















































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































TCP/IP 2 
111-116 v_lcl_grps IP 
v lcl grps v lcl grps max 
v lcl grps n 
v cached. droup v. cached, result “ É 
14-15 viftable 32[] (MAXVIFS) viftable[2] 
numvifs[] 3 
vif v_ifp ifnet v lcl grps in addr 
32(v lcl grps max) 4[] (v. 1c1. grps. n) 
mrouted DVMRP ADD VIF|| DVMRP DEL VIF viftable 
mrouted mrouted 
/etc/mrouted.conf 
mrouted[| DVMRP ADD VIF ctl (U 14-16) 
ip mroute.h 
76 struct vifctl ( 
71 vifi t vifc vifi; . /* the index of the vif to be added */ 
78 u_char vifc flags; /* VIFF flags (Figure 14.14) */ 
79 u_char vifc threshold; /* min ttl required to forward on vif */ 
80 struct in_addr vifc lcl addr; /* local interface address */ 
81 struct in, addr vifc rmt addr; /* remote address (tunnels only) */ 
2 33 = 
an ip_mroute.h 
[ 14-16 vifctl DI 
78-82 vifc vifi viftable 4 vifc flags 
vifc_threshold| | vifc lcl addr|| vifc rmt addr add vif vif 
14.5.2 add vif 
14-17[] add vif 
ip mroute.c 





202 static int 


203 add vif(vifcp) 
204 struct vifctl *vifcp; 


205 
206 
207 
208 
209 
210 
211 
212 


213 
214 
215 
216 


t 


struct vif *vifp = viftable + vifcp-»vifc vifi; 
Struct ifaddr *ifa; 

struct ifnet *ifp; 

struct ifreq ifr; 

int error, S; 

static struct sockaddr in sin - 

(sizeof(sin), AF INET); 


if (vifcp-»vifc vifi »- MAXVIFS) 


return (EINVAL); 


if (vifp->v lcl, addr.s addr != 0) 


return (EADDRINUSE); 
U 14-17 add vif [][] [| DVMRP ADD vr T 











abu tO N my 

























































































325 



















































































































































































































































































































































































































































































































































































































































































































































































217 /* Find the interface with an address in AF_INET family */ 
218 sin.sin_addr = vifcp->vifc lcl addr; 
219 ifa = ifa ifwithaddr((struct sockaddr *) &sin); 
220 if (ifa == 0) 
221 return (EADDRNOTAVAIL) ; 
222 s = splnet (); 
223 if (vifcp->vifc_flags & VIFF_TUNNEL) 
224 vifp->v_rmt_addr = vifcp->vifc_rmt_addr; 
225 else {. 
226 /* Make sure the interface supports multicast */ 
227 ifp = ifa->ifa_ifp; 
228 if ((ifp->if_flags & IFF_MULTICAST) == 0) { 
229 splx(s); 
230 return (EOPNOTSUPP); 
231 ) mE 
232 /* 
233 * Enable promiscuous reception of all IP multicasts 
234 * from the interface. 
235 */ 
236 satosin(&ifr.ifr addr)->sin family = AF INET; 
237 satosin(&ifr.ifr addr)->sin addr.s addr = INADDR ANY; 
238 error = (*ifp->if_ioctl) (ifp, SIOCADDMULTI, (caddr t) & ifr); 
239 if (error) ( 
240 splx(s); 
241 return (error); 
242 } 
243 } 
244 vifp->v_flags = vifcp->vifc_flags; 
245 vifp->v_threshold = vifcp->vifc_threshold; 
246 vifp->v_lcl_addr = vifcp-»vifc, lcl addr; 
247 vifp->v ifp = ifa->ifa_ifp; 
248 /* Adjust numvifs up if the vifi is higher than numvifs */ 
249 if (numvifs <= vifcp->vifc_vifi) 
250 numvifs = vifcp-»vifc vifi + 1; 
251 splx(s); 
252 return (0); 
=) ip_mroute.c 
14-17 (0) 
1. 
202-216 mrouted vifc_vifi 
EINVAL|| EADDRINUSE 
2. 
217-221 ifa_ifwithaddr vifc lcl addr IP 
ifnet 
EADDRNOTAVAIL 
3. 
222-224 vifctl vif 
4. 
22 5=243 SIOCADDMULTI 

























































































































































































326 TCP/IP 2 China-pubcom 
— — a 
























































































































































































































































INADDR_ANY IP ([] 12-32) 
ipintr ip mforward ip mforward 
5. 
244-253 vifctl vif numvifs 


















































































































































































































































14.5.3 del vif[] 


























































































































































































































































































































































































































14-18 del vif mrouted DVMRP ` 
DEL VIF 
1. 
257-268 del_vif | 
EINVAL[] EADDRNOTAVAIL 






























































ip_mroute.c 


257 static int 
258 del vif(vifip) 
259 vifi t *vifip; 


260 ( 
261 
262 
263 
264 


265 
266 
267 
268 


269 


struct vif *vifp = viftable + *vifip; 
struct ifnet *ifp; 

int i, s; 

struct ifreg ifr; 


if (*vifip >= numvifs) 
return (EINVAL); 

if (vifp-»v lcl addr.s addr == 0) 
return (EADDRNOTAVAIL); 


s = splnet(); 


if (!(vifp->v flags & VIFF TUNNEL)) { 
if (vifp-»v lcl grps) 
free(vifp->v lcl grps, M MRTABLE); 
satosin(&ifr.ifr addr)->sin family = AF INET; 
satosin(&ifr.ifr addr)->sin addr.s addr = INADDR ANY; 
ifp = vifp-»v ifp; 
(*ifp->if ioctl) (ifp, SIOCDELMULTI, (caddr t) & ifr); 
3 
bzero((caddr t) vifp, sizeof(*vifp)); 


/* Adjust numvifs down */ 
for (i = numvifs - 1; i >= 0; i--) 
if (viftable[i].v lcl addr.s addr != 0) 
break; 
numvifs = i + 1; 


splx(s); 
return (0); 





O 14-18 del vif [][] [| DVMRP DEL VIF [| [| 


























269=278 SIOCADDMULTI 























































































































































































































viftable 











Chinaspubecom wami NA 




























































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































v. lcl addr( in addr JO O s addr[] 0 
numvifs | 
14.6 IGMP(D) 
13 IGMP mrouted mrouted 
mroutead[] 120 
IGMP HOST MEMBERSHIP QUERY IGMP HOST MEMBERSHIP REPORT 
13 
mrouted | 
14-14 v lcl grps IP mrouted[| DVMRP . 
ADD LGRP|| DVMRP DEL LGRP lgrpctl 
([] 14-19) 




















ip mroute.h 
87 struct lgrplctl { 










88 vifi.t gc vifi; 
89 struct in_addr igc gaddr; 
90 y; S 
: ip mroute.h 
U 14-19 Igrpct1 [| [| 
DO 
pp. 775 M a ooo CUT 


DVMRP ADD LGRP OM 
setsockopt 


rip_ctloutput 
1p_mroute_cmd 





IGMP_HOST_MEMBERSHIP_REPORT 


000 


D 14-20 IGMPO D n D 


328 















































Chlnapubscom 









































































































































































































































































































































































































































































































































TCP/IP 2 
87-90 lgc_vifill lgc_gaddr { } ( lgc_vifi) 
IGMP_HOST_MEMBERSHIP_REPORT 14-20 
14.6.1 add_lgrp 
mrouted IGMP 
ip_mroute.c 


291 static int 
292 add lgrp(gcp) 
293 struct lgrplctl *gcp; 


294 ( 
295 
296 


297 
298 


299 
300 
301 


302 
303 
304 
305 
306 


307 
308 
309 
310 
311 
312 
313 
314 
315 
316 
317 
318 
319 
320 


321 
322 
323 
324 


325 
326 
327 


328 
329 


330 
331 
332 } 


struct vif *vifp; 


int 


Si 


if (gep->lge vifi >= numvifs) 


vifp 
if (vifp-»v lcl addr.s addr == 0 |i 


return (EINVAL); 


= viftable + gcp->1gc_vifi; 


return (EADDRNOTAVAIL); 


(vifp->v flags & VIFF_TUNNEL)) 


/* If not enough space in existing list, allocate a larger one */ 


s = 


splnet(); 


if (vifp-»v lcl grps n + 1 >= vifp-»v lcl grps max) { 


} 


vifp->v_1c1_grps [vifp->v_1c1_grps_n++] 


int num; 
struct in_addr *ip; 


num = vifp->v lcl grps max; 
if (num <= 0) 
num = 32; 
else 
num += num; 


/* initial number */ 


/* double last number */ 


ip = (struct in addr *) malloc(num * sizeof(*ip), 
M MRTABLE, M_NOWAIT); 


if (ip == NULL) { 
splx(s); 
return (ENOBUFS); 
} 
bzero((caddr t) 
bcopy((caddr t) vifp->v lcl grps, 


vifp-»v lcl grps n * sizeof(*ip)): 


vifp-»v lcl grps max = num; 
if (vifp-»v. lcl, grps) 


free(vifp-»v lcl grps, M MRTABLE); 


vifp-»v lcl grps = ip; 


splx(s); 


ip, num * sizeof(*ip)); 


/* XXX paranoid */ 


(caddr_t) ip, 


gcp-»1gc gaddr; 


if (gcp->lgc gaddr.s addr -- vifp-»v cached group) 


vifp-»v cached result - 1; 


splx(s); 
return (0); 





D 14-21 


— ip_mroute.c 


add lgrp [| [| [| DVMRP_ADD GRP [| [J 








14 IP 























329 



















































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































mrouted DVMRP_ADD_LGRP 
14-21 add_lgrp 
1. 
291-301 EINVAL 
EADDRNOTAVAIL 
2. 
302-326 
add lgrp 32 
add lgrp Malloc 
bzero bcopy 
v lcl grps max ( ) v lcl grps vif 
" (paranoid)" malloc 
3. 
327-332 
v cached group 
v cached result[] grplst_member|] [] 
L [| v_cached_groupl] 
14.6.2 del_lgrpl] |] 
270 
mrouted DVMRP DEL LGRP 14-22 
del_lgrp 
1. 
337=347 EINVAL 
EADDRNOTAVAIL 
2. 
348-350 oq] ) 
3. 
351-364 error EADDRNOTAVAIL[] for 
same( bcmp ) 
error 1] bcopy del_lgrp 






















































































































































































































































































EADDRNOTAVAIL 






















































































330 TCP/IP 2 China+pub.tom 
— — ta 






















































































































































































































































































































































































i Å 
337 static int p-mroute,c 

338 del lgrp(gcp) 

339 struct igrplctl *gcp; 

340 ( 

341 struct vif *vifp; 

342 int i, error, s; 

343 if (gcp-»1gc vifi >= numvifs) 

344 return (EINVAL); 

345 vifp = viftable + gcp-»lgc, vifi; 

346 if (vifp->v lcl addr.s addr == 0 || (vifp->v flags & VIFF TUNNEL)) 

347 return (EADDRNOTAVAIL); 

348 S - splnet(); 

349 if (gcp-»1gc gaddr.s addr == vifp->v cached group) 

350 vifp-»v cached result - 0; 

351 error - EADDRNOTAVAIL; 

352 for (i = 0; i « vifp-»v lcl grps n; ++i) 

353 if (same(&gcp->lgc_gaddr, &vifp-»v icl grps[il)) I 

354 error - 0; 

355 vifp->v lcl.grps n--; 

356 bcopy((caddr t) & vifp-»v Lei grps[i + 1], 

357 (caddr t) & vifp-»v lcl grps[i], 

358 (vifp->v lcl grps n - i) * sizeof (struct in addr)); 

359 error - 0; 

360 break; 

361 } 

362 splx(s); 

363 return (error); 

364 } å 

ip mroute.c 
O 14-22 del jop [| [| opp DEL_LGRE] O 
14.6.3 grplst member 
14- 
23 grplst member 
ip mroute.c 





368 static int 

369 grpist member (vifp, gaddr) 
370 struct vif *vifp; 

371 struct in addr gaddr: 


372 L 

373 int i, s; 

374 u long addr; 

375 mrtstat.mrts grp lookups++; 

376 addr = gaddr.s addr; 

377 if (addr == vifp-»v cached group) 

378 return (vifp->v cached result); 

379 mrtstat.mrts grp misses4-; 

380 for (i = 0; i < vifp-»v lcl grps n; ++i) 


O 14-23 grplst member [|] [| 





China-bubcom "P 331 














































































































































































































































































































































































































































































































































































































381 if (addr == vifp-»v.1cl grps[il.s addr) { 

382 S = splnet(); 

383 vifp-»v cached group - addr; 

384 vifp-»v cached result - 1; 

385 > splx(s); 

386 return (1); 

387 } 

388 s = splnet(); 

389 vifp->v_cached_group = addr; 

390 vifp->v_cached_result = 0; 

391 splx(s); 

392 return (0); 

393 } . 

ip mroute.c 
D 14-23 (0) 
1. 
368-379 
2, 
380-390 
1 0 
14.7 DO DD 
mrouted TRPB 



























































































































































14-24 






































































































































































































































































































































































































































































































































































































































































































































































































































01424 D D D H DD 
14-24 D 
D C CHO C AI B 
E 
14-25 
A S 
[Tanenbaum 1989] [Perlman 1992] 




















































































































332 TCP/IP 2 Chibasbub to 
— MA 






































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































U 1425 ID ALI L1 LI D 

A (reverse path) 
14-25 BJ € A 
B[] € 

C B 
RFC 1075 
(reverse path broadcast)|| RPB 
RPB 
(TRPB)[] 2.0 mrouted[] IGMP 
14-26 TRPB C B 
14-26 Net/3 























































































































































































































0 14-26 0 0 cg TRPBO 0O00 










































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































C AI B CH D 
CU D 
A Bl] DJ E C A 
B[] E = AQ E TRPB 
C C C 
C AJ Bl] E A C 
A 
AJ DJ E 
B 
B B 
viftable 
(reverse path multicasting 
RPM)[] RPM (prune) 
14-26 RPM C[] A[] E 
3.3 mrouted RPM 
14-27 RPM 




















































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































Net/3 DVMRP DVMRP IGMP 
224.0.0.4 DVMRP ( 12-1) 
12-39 IGMP 
igmp input[] rip input mrouted IGMP mrouted 
DVMRP IGMP 
RPB[] TRPB[] RPM DVMRP [Deering 
Cheriton 1990] [| mrouted 
Internet Proteon RFC 1584 [Moy 1994] 
MOSPF Cisco 10.2 PIM(Protocol Independent 
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Multicasting)[] [Deering et al1994] PIM 
14.7.1 
Net/3 64 
(MRTHASHIZ) mrttable 
mrt 14-28 
ip_mroute.h 
120 struct mrt { 2 
121 Struct in addr mrt origin; /* subnet origin of multicasts */ 
122 Struct in, addr mrt originmask;  /* subnet mask for origin */ 
123 vifi t mrt, parent; /* incoming vif */ 
124 vifbitmap t mrt children; /* outgoing children vifs */ 
125 vifbitmap t mrt leaves; /* gubset of outgoing children vifs */ 
126 struct mrt *mrt next; /* forward link */ 
127 ); < 
Ñ ip_mroute.h 
0 14-28 mrt [] [| 
120-127 mrtc origin[| mrtc_originmask mrtc parent 
mrtc children 
mrtc leaves 
mrt next 
14-29 mrt 
nethash([] 14-31) 
mrttable: mrt() mrt() mrt() 
0 










mrt{} 


mrttable[5] 


U 
mrttable[62] 








63 



































































































































































































































































































































































































































01429 90009 
mrouted 
DVMRP_ADD_MRT 14-30 mrtctl 
95-101 mrtctl 5 mrouted ([] 14-28) 
IP nethash([] 14-31) 
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IP 0-63 (MRTHASHSIZ- 1) 
ip_mroute.h 
95 struct mrtctl { 
96 struct in_addr mrtc_origin; /* subnet origin of multicasts */ 
97 struct in_addr mrtc_originmask; /* subnet mask for origin */ 
98 vifi_t mrtc_parent; /* incoming vif */ 
99 vifbitmap_t mrtc_children; /* outgoing children vifs */ 
100 vifbitmap_t mrtc_leaves; /* subset of outgoing children vifs */ 
101 T: . 
ip mroute.h 
O 14-30 mrtctl [] [| 
s ip_mroute.c 
398 static u long 
399 nethash(in) 
400 struct in_addr in; 
401 ( 
402 u long n; 
403 n = in netof (in); 
404 while ((n & Oxff) == 0) 
405 n >>= 8; 
406 return (MRTHASHMOD(n)); 
407 ) š 
ip_mroute.c 
[] 14-31 nethash [] [] 
398-407 in netof in 0 n A[] B[] C 
8 MRTHASHMOD 
#define MRTHASHMOD(h) ((h) & (MRTHASHSIZ - 1)) 
8 63 6 0-63 
(nethash[] in. netof) 32 bit 
14.7.2 del mrt 
mrouted DVMRP ADD MRT[|| DVMRP DEL MRT 
14-32 del mrt 
— ip_mroute.c 
451 static int 
452 del mrt (origin) 
453 struct in addr *origin; 
454 { 
455 struct mrt *rt, *prev rt; 
456 u long hash = nethash(*origin); 
457 int S; 
458 for (prev rt - rt - mrttable[hash]; rt; prev rt - rt, rt - rt-»mrt next) 
459 if (origin-»s addr -- rt-»mrt origin.s addr) 
460 break; 
461 if (!rt) 
462 return (ESRCH); 
463 S - splnet(); i 





0 14-32 del mrt 90 0 DVMRP DEL MT OG 















































336 reenn n: China-pubıcom 
— Eg 







































































































































































































































































































































































































































































































































































































































































464 if (rt == cached mrt) 
465 cached mrt = NULL; 
466 if (prev rt == rt) 
467 mrttable[hash] = rt->mrt next; 
468 else 
469 prev rt->mrt next = rt->mrt next; 
470 free(rt, M MRTABLE); 
471 splx(s); 
472 return (0); 
473 } ; 
ip_mroute.c 
0 14-32 (O) 
1. 
451-462 for hash (| nethash ) 
ESRCH 
2. 
463-473 
3f 
14.7.3 add mrt 
add mrt 14-33 
ip mroute.c 


411 static int 
412 add mrt (mrtcp) 
413 struct mrtctl *mrtcp; 


414 ( 
415 
416 
417 


418 
419 
420 
421 
422 
423 
424 
425 
426 
427 


428 
429 
430 
431 
432 
433 
434 
435 
436 
437 
438 


struct mrt *rt; 
u long hash; 
int s; 


if (rt = mrtfind(mrtcp->mrtc_origin)) ( 
/* Just update the route */ 
s = splnet(); 
rt->mrt_parent = mrtcp->mrtc_parent; 
VIFM_COPY (mrtcp->mrtc_children, rt->mrt_children); 
VIFM COPY (mrtcp->mrtc leaves, rt->mrt_leaves); 
splx(s); i 
return (0); 


} 
S = spinet (); 


rt = (struct mrt +) malloc(sizeof(*rt), M_MRTABLE, M NOWAIT); 
if (rt == NULL) { 
splx(s); 
return (ENOBUFS); 
} 
/* 
* insert new entry at head of hash chain 
*/ 
rt-»mrt origin - mrtcp-»mrtc origin; 
rt-»mrt originmask - mrtcp-»mrtc originmask; 
rt-»mrt parent - mrtcp-»mrtc parent; 


[] 14-33 add mrt 00000 DVMRP_ADD MRT DJ 
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439 VIFM_COPY (mrtcp->mrtc_children, rt->mrt_children); 
440 VIFM COPY(mrtcp-»mrtc leaves, rt-»mrt leaves); 
441 /* link into table */ 
442 hash - nethash(mrtcp-»mrtc origin); 
443 rt-»mrt next = mrttable[hash]; 
444 mrttable[hash] = rt; 
445 splx(s); 
446 return (0); 
447 } : 
p mroute.c 
H 14-33 (0) 
1. 
411-427 add mrt 
2. 
428-447 mbuf mrtctl mrt 
mrtc_origin 
14.7.4 mrtfind[] 
mrtfind 14-34 mrtfind 
mrtfind mrt 
1. 
477-488 IP (orgin) 
cached origin 
i ip mroute.c 
477 static struct mrt * 
478 mrtfind(origin) 
479 struct in_addr origin; 
480 { : 
481 struct mrt *rt; 
482 u int hash; 
483 int s; 
484 mrtstat.mrts_mrt_lookups++; 
485 if (cached mrt != NULL && 
486 (origin.s_addr & cached_originmask) == cached_origin) 
487 return (cached mrt); 
488 mrtstat.mrts mrt misses++; 
489 hash - nethash(origin); 
490 for (rt - mrttable[hash]; rt; rt - rt-»mrt next) 
491 if ((origin.s addr & rt-»mrt originmask.s addr) -- 
492 rt-»mrt origin.s addr) ( 
493 S = splnet (1: 
494 cached_nrt = rt; 
495 cached_origin = rt->mrt_origin.s_addr; 
496 cached_originmask = rt->mrt_originmask.s_addr; 
497 splx(s); 
498 return (rt); 
499 } 
500 return (NULL); 
501 } š 
ip_mroute.c 


O 14-34 mrtfind [] [] 
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489-501 nethash for 
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12-39 ip mrouter 
mrouted ipintr ip mforward 
12-40 ip output ip 
mforward ip mforward ip output 
14-35 









































































































































00000 ipintr 





OU 
(O 14-39) 






ipintrg: ne 








tunnel_send 


CEumne1 send 
Cebyint send) 


















































































































































































































































































































































































































































































































































































































































































































0000 00 Don 
01435 O0000000000000 
14-35 
ip mforward 
( ) 
14-36 
14-36 
ip mforward 14-37 
ip mforward ipintr 
ip mforward 




















































































































































































































































































































































































































































































































































































































































































































































































































































































































14-36 ip output 
ip mloopback[]| ip mloopback[] | ipintr ( 
ip mforward ( 14.4) 
ip_mforward UL ) ipintr 


























































































































































































































000000 
(O 14-39) 


ip_mloopback 


O000000000000 
O000000000 




















































































































































































































(0000 DO O00 
01436 IO0000000000000 

. ( 14-37) 

° (O 14-39) 

. ( 14-40) 

- ip_mroute.c 

516 int 
517 ip_mforward(m, ifp) 
518 struct mbuf *m; 
519 struct ifnet *ifp; 
520 { 
521 struct ip tip = mtod(m, struct ip *); 
522 struct mrt *rt; 
523 struct vif *vifp; 
524 int vifi; 
525 u_char *ipoptions; 
526 u_long tunnel_src; 
527 if (ip->ip_hl < (IP_HDR_LEN + TUNNEL_LEN) >> 2 || 
528 (ipoptions = (u char zi (ip + 1)) [1] !- IPOPT LSRR) { 
529 /* Packet arrived via a physical interface. */ 
530 tunnel src = 0; 
531 } else { 
532 /* 
533 * Packet arrived through a tunnel. 
534 * A tunneled packet has a single NOP option and a 


0 14-37 ip mforwrd 0020000090 








340 
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535 * two-element loose-source-and-record-route (LSRR) 
536 * option immediately following the fixed-size part of 
537 * the IP header. At this point in processing, the IP 
538 * header should contain the following IP addresses: 
539 * 
540 * original source - in the source address field 
541 * destination group - in the destination address field 
542 * remote tunnel end-point — in the first element of LSRR 
543 * one of this host's addrs - in the second element of LSRR 
544 * 
545 * NOTE: RFC-1075 would have the original source and 
546 * remote tunnel end-point addresses swapped. However, 
547 * that could cause delivery of ICMP error messages to 
548 * innocent applications on intermediate routing 
549 * hosts! Therefore, we hereby change the spec. 
550 */ 
551 /* Verify that the tunnel options are well-formed. */ 
552 if (ipoptions[0] != IPOPT_NOP || 
553 ipoptions[2] != 11 || /* LSRR option length */ 
554 ipoptions[3] != 12 || /* LSRR address pointer */ 
555 (tunnel src = *(u long +) (&ipoptions[41)) == 0) L 
556 mrtstat.mrts bad tunnel++; 
557 å return (1); 
558 } 
559 /* Delete the tunnel options from the packet. */ 
560 ovbcopy((caddr t) (ipoptions + TUNNEL LEN), (caddr t) ipoptions, 
561 (unsigned) (m-»m len - (IP HDR LEN + TUNNEL LEN))); 
562 m-»m len -- TUNNEL LEN; 
563 ip->ip len -= TUNNEL LEN; 
564 ip->ip_hl -= TUNNEL LEN >> 2; 
565 ) 3 
ip_mroute.c 
0 14-37 (0) 
516-526 ip_mforward mbu 
ifnet 
1. 
527-530 IP 
LSRR LSRR 
NOP tunnel_src 0 
2: 
531-558 
ip_mforward 1 14-38 
14-38 
IP LSRR LSRR 
3. 
559-565 mbuf| m len[] IP 
ip len[] ip hl (O 14-38) 
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11 (length) 
— 12(offset) 


































































































































































































































































































































































































































































































































































































200 0 
01438 000000 
ip_mforward tunnel_source 
ip_mforward ipintr 
ip_mforward ipintr 
ip_output 
ip_output ip_mloopback 
ip_mforward 14-39 
ip_mroute.c 
566 /* 
567 * Don't forward a packet with time-to-live of zero or one, 
568 * or a packet destined to a local-only group. 
569 */ 
570 if (ip-»ip ttl <= 1 | 
571 ntohl (ip->ip_dst.s_addr) <= INADDR_MAX_LOCAL_GROUP) 
572 return ((int) tunnel_src); 
573 /* 
574 * Don’t forward if we don’t have a route for the packet’s origin. 
575 */ 
576 I if (! (xt = mrtfind(ip->ip_src))) L 
577 mrtstat.mrts no route++; 
: 578 return ((int) tunnel src); 
579 } 
580 /* 
581 * Don’t forward if it didn’t arrive from the parent vif for its origin. 
582 */ 
583 vifi = rt->mrt parent; 
584 if (tunnel_src == 0) { 
585 if'((viftable[vifi].v flags & VIFF TUNNEL) || 
586 viftable[vifi].v_ifp !- ifp) 
587 return ((int) tunnel_src); 
588 } else { 
589 if (!(viftable[vifi].v flags & VIFF TUNNEL) || 
590 viftable[vifi].v rmt addr.s addr != tunnel src) 
591 return ((int) tunnel src); 
592 } š 
ip_mroute.c 


0 14-39 ip mforward [000000000 
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4. TTL 
566-572 ip tti OG 1 
INADDR MAX LOCAL GROUP( 224.0.0.x 12-1) 
tunnel src 
3.3 mrouted 
224.0.0.x 
5. 
573-579 mrtfind 
mrouted 
6. 
580-592 
ip_mforward 
ip_mforward 
ip_mforward (O 14-40) 
————————————————————————————————— ip mroute.c 
593 FX 
594 * For each vif, decide if a copy of the packet should be forwarded. 
595 * Forward if: . 
596 u - the ttl exceeds the vif’s threshold AND 
597 * - the vif is a child in the origin’s route AND 
598 * - ( the vif is not a leaf in the origin's route OR 
599 * the destination group has members on the vif ] 
600 * 
601 * (This might be speeded up with some sort of cache -- someday.) 
602 *f 
603 for (vifp = viftable, vifi = 0; vifi « numvifs; vifp++, vifi++) ( 
604 if (ip-»ip ttl > vifp->v threshold && 
605 VIFM ISSET(vifi, rt->mrt children) && 
606 (IVIFM ISSET(vifi, rt->mrt leaves) || 
607 arplst member (vifp, ip->ip_dst))) { 
608 if (vifp->v_flags & VIFF TUNNEL) 
609 tunnel send(m, vifp); 
610 else 
611 phyint send(m, vifp); 
612 ) 
613 } 
614 return ((int) tunnel src); 
615 ) 
I IH mroute.c 
[ 14-40 ip mforward T) U D 
593-615 viftable 
























































































































































TTL 














































































































14 IP 
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grplst member 


tunnel send phyint_send 


14.8.1 






























































































































































































































































phyint_send|| 














































































































phyint send([] 14-41) 


























ip output 








ip moptions 




























































































616 static void 

617 phyint send(m, vifp) 
618 struct mbuf *m; 

619 struct vif *vifp; 


ip mroute.c 


ip mroute.c 






































































































































































































































620 ( 

621 struct ip *ip = mtod(m, struct ip *); 

622 struct mbuf *mb copy; 

623 struct ip_moptions *imo; 

624 int error; 

625 struct ip moptions simo; 

626 mb copy = m copy(m, 0, M COPYALL) ; 

627 if (mb copy -- NULL) 

628 return; 

629 imo - &simo; 

630 imo->imo_multicast_ifp = vifp-»v ifp: 

631 imo-»imo multicast ttl = ip-»ip ttl - 1; 

632 imo-»imo multicast loop = 1; 

633 error ip output (mb copy, NULL, NULL, IP FORWARDING, 

634 ) 

U 14-41 phyint send U 
616-634 m copy ip moptions 
TTL | 
ip output IP FORWARDING 

ip output ip mforward 

















































































































m next 


200 O 
014422 O00000 





























344 TCP/IP 2 


14.8.2 tunnel send 


China-pubscom 
































































































































tunnel_send({] 14-43) 



























































































































































14-42 tunnel_send 
































ip_mroute.c 


635 static void 

636 tunnel_send(m, vifp) 
637 struct mbuf *m; 

638 struct vif *vifp; 

























































































































































































































































































































































































































































































































































































639 { 
640 struct ip *ip = mtod(m, struct ip *); 
641 struct mbuf *mb_copy, *mb_opts; 
642 struct ip *ip_copy; 
‚643 int error; 
644 u char *cp; 
645 /* i 
646 * Make sure that adding the tunnel options won't exceed the 
647 * maximum allowed number of option bytes. 
648 */ 
649 if (ip-»ip hl > (60 - TUNNEL LEN) >> 2) ( 
650 mrtstat.mrts cant tunnel«*; 
651 return; 
652 } 
653 PE 
654 * Get a private copy of the IP header so that changes to some 
655 £ of the IP fields don't damage the original header, which is 
656 * examined later in ip input.c. 
657 */ 
658 mb copy = m_copy (m, IP HDR LEN, M_COPYALL); 
659 if (mb copy == NULL) 
660 return; 
661 MGETHDR (mb opts, M_DONTWAIT, MT_HEADER); 
662 if (mb_opts == NULL) { 
663 m freem(mb copy); 
664 return; 
665 } 
666 /* 
667 * Make mb opts be the new head of the packet chain. 
668 * Any options of the packet were left in the old packet chain head 
669 * 
670 mb_opts->m_next = mb_copy; 
671 mb_opts->m_len = IP_HDR_LEN + TUNNEL_LEN; 
672 mb_opts->m_data += MSIZE - mb_opts->m_len; 7 
B ip mroute.c 
D 14-43 tunnel send [0000000000 
1. 
635-652 IP tunnel_send 
2. mbuf 
653-672 m_copy 20(IP_HDR_LEN) mbu 
IP mb_opts MGETHDR 
mb_copy m_len|| m data 
IP 
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tunnel send 14-44 
- - ip mroute.c 
673 ip copy = mtod(mb opts, struct ip >); 
674 /* 
675 * Copy the base ip header to the new head mbuf. 
676 */ 
677 *ip copy = *ip; 
678 ip copy->ip ttl--; 
679 ip copy->ip dst = vifp-»v rmt addr; /* remote tunnel end-point */ 
680 £* 
681 * Adjust the ip header length to account for the tunnel options. 
682 */ 
683 ip copy->ip hl += TUNNEL LEN >> 2; 
684 ip copy->ip len += TUNNEL LEN; 
685 pt 
686 * Add the NOP and LSRR after the base ip header 
687 Sy 
688 cp = (u char *) (ip copy + 1); 
689 *cp++ = IPOPT_NOP; 
690 *cp++ = IPOPT_LSRR; 
691 *cp++ = 11; /* LSRR option length */ 
692 *cp++ = 8; /* LSSR pointer to second element */ 
693 *(u long *) cp = vifp->v lcl addr.s addr; /* local tunnel end-point */ 
694 cp += 4; 
695 *(u long +) cp = ip-»ip dst.s addr; /* destination group */ 
696 error = ip output (mb opts, NULL, NULL, IP FORWARDING, NULL); 
697 3 : 
ip mroute.c 
O 14-44 tunnel send 0000000000 
3. IP 
673-679 mbu IP mbu TTL 
4. 
680—664 ip hl[| ip len IP 
NOP LSRR LSRR (11 ) (8 
) (O 14-13) 
5. 
665-697 LSRR 
ip output 
14.9 [][] [| ip mrouter donell [|] 
mrouted DVMRP. DONE ip mrouter done (O 14-45) 
161-186 splnet 
SIOCDELMULTI ( 14.3) 
bzero viftable numvifs 0 
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187-198 
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bzero 






























































































































































































































































































































































oo mroute. 











































































































































































































































































































161 int 
162 ip mrouter done() 
163 { 
164 vifi t vifi; 
165 int i; 
166 struct ifnet *ifp; 
167 int 8; 
168 struct ifreq ifr; 
169 S = splnet(); 
170 /* 
171 * For each phyint in use, free its local group list and 
172 * disable promiscuous reception of all IP multicasts. 
173 */ 
174 for (vifi = 0; vifi < numvifs; vifi++) ( 
175 if (viftable[vifi].v lcl addr.s addr != 0 && 
176 !(viftable[vifi].v flags & VIFF TUNNEL)) ( 
177 if (viftable[vifi].v lcl grps) 
178 free(viftable[vifi].v lcl grps, M MRTABLE); 
179 satosin(&ifr.ifr addr)->sin family = AF INET; 
180 satosin(&ifr.ifr_addr)->sin_addr.s_addr = INADDR ANY; 
181 ifp = viftable[vifi] .v_ifp; 
182 (*ifp->if_ioctl) (ifp, SIOCDELMULTI, (caddr_t) & ifr); 
183 } 
184 } 
185 bzero((caddr t) viftable, sizeof (viftable)); 
186 numvifs - 0; 
187 /* 
188 * Free any multicast route entries. 
189 */ i 
190 for (i = 0; i < MRTHASHSIZ; i++) 
191 if (mrttable[i]) 
192 free(mrttable[i], M MRTABLE); 
193 bzero((caddr t) mrttable, sizeof(mrttable)); 
194 cached mrt - NULL; 
195 ip mrouter - NULL; 
196 splx(s); 
197 return (0); 
198 } , 
ip mroute.c 
O 14-45 ip mrouter done [| [| [| DVMRP_DONE UI 
14.10 OQ 
Net/3 
mrouted 
Net/3 
LSRR 
RPB[] TRPB[] RPM TRPB 
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U U 

14.1 QQ 14-250 0 ] 100000 

142 DO O spinet se1x0 0 00 1423000 000000000060 

143 000000 1P_ADD_MEMBERSHIP) D B U D B DU] HI U OD DO O 0 7I U DIO 
SIOCDELMULTI[| 000000 

14.4 [] U U U U U U 0000 ip mforward]J UU U U U U U 
U U U 000 DU ip outpt U U LU LI D UD LIO U D OE CE 0 0 0 LU DE U LI C] 
ip mforward ] 0000 

145 000000000000 000000 
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iS] D U H 





























































































































































































































































































































































































































































































































































































































































































































































































































































































































151 OO 
Net/3 | | 1983 
4.2BSD | | | 
Net/3 4.3BSD Reno Unix 42 
1.7 
Unix I/O | U read[] write 0 BSD] [] 
( ) 
read|| write sendmsgl| recvmsg 
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O0O0O0000000000000000 











[Rago 1990] 
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15 
splnet[] | 
splnet[] splx|] [] 1.12[] 0 
ODO Uuuu JOD splnet[] | 
| i 
o 0 LU U U U 
15.2 [Ul 
| 15-2 
U [] 0 E 
sys/socketvar.h socket] O00 
kern/uipc_syscalls.c 000000 
kern/uipc socket.c 00000 






































0152 9000000000 














































































































socketps 


sysent 








struct fileop 


UO OOOO socket] 0 





struct sysedt| 00000000 








15.3 socket[] [] 


153 00000000 

























































































































































































































































































































































































































































































































































































































































































































































































































































































































































































| U UU 
( ) 

15-5 LU 
41-42 so type uu U | 
so_type O U 7-8 pr_type UDP[] so type SOCK DGRAM| 
TCP[] so type SOCK STREAM 
43 so options | 15-4 

getsockopt|| setsockopt SO ACCEPTCONN 

DO! listen[] H 0 so AccerTcony[] | 
44 so linger] |] O 0 0 0 D I U ( L 
DIO 15.150 ) 
45 so state | 15-6| so state 
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— AM 


so_options D D DD U U 


SO_ACCEPTCONN . 
SO_BROADCAST 
SO_DEBUG 

SO_DONTROUTE 
SO_KEEPALIVE 























SO_OOBINLINE 00000000 
SO_REUSEADDR U D D D 
SO_REUSEPORT 0200000090 















































O00000000000000 


SO_USELOOPBACK 























O 15-4 so options [| [| 


socketvar.h 
41 struct socket { 
42 short so_type; /* generic type, Figure 7.8 */ 
43 short so_options; /* £rom socket call, Figure 15.5 */ 
44 short so_linger; /* time to linger while closing */ 
45 short so_state; /* internal state flags, Figure 15.6 */ 
46 caddr t so pcb; /* protocol control block */ 
47 Struct protosw *so proto; /* protocol handle */ 
48 /* 
49 * Variables for connection queueing. 
50 * Socket where accepts occur is so head in all subsidiary sockets. 
51 * If so head is 0, socket is not related to an accept. 
52 * For head socket so q0 queues partially completed connections, 
53 * while so q is a queue of connections ready to be accepted. 
54 * If a connection is aborted and it has so head set, then 
55 + it has to be pulled out of either so q0 or so 9. 
56 * We allow connections to queue up based on current queue lengths 
57 + and limit on number of queued connections for this socket. 
58 */ - 
59 struct socket *so_head; /* back pointer to accept socket */ 
60 struct socket *so_q0; /* queue of partial connections */ 
61 struct socket *so_q; /* queue of incoming connections */ 
62 short so_q0len; /* partials on so 9g0 */ 
63 short so glen; /* number of connections on so q */ 
64 short so glimit; /* max number queued connections */ 
65 short so_timeo; /* connection timeout */ 
66 u_short so_error; /* error affecting connection */ 
67 pid_t so_pgid; /* pgid for signals */ 
68 u_long so_oobmark; /* chars to oob mark */ 
69 /* 
70 * Variables for socket buffering. 
71 */ 
72 struct sockbuf ( 
73 u_long sb cc; /* actual chars in buffer */ 
74 u_long sb_hiwat; /* max actual char count */ 
75 u long sb mbcnt; /* chars of mbufs used */ 
76 u long sb mbmax; /* max chars of mbufs to use */ 
77 long sb lowat; /* low water mark */ 
78 struct mbuf *sb_mb; /* the mbuf chain */ 
79 struct selinfo sb sel; /* process selecting read/write */ 
80 short sb flags; /* Figure 16.5 */ 
81 short sb timeo; /* timeout for read/write */ 
82 ) so rcv, so snd; 
83 caddr t so tpcb; /* Wisc. protocol control block XXX */ 


O 15-5 struct sockdt[] 
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84 void (*so_upcall) (struct socket * so, caddr t arg, int waitf); 
85 caddr_t so_upcallarg; /* Arg for above */ 
86 ); i 
socketvar.h 
0155 (0) 
so_state 00000 U U 
SS_ASYNC D 0 0 D vo) D D 0000 
SS_NBIO 0020000000 
SS_CANTRCVMORE . 000000000000 
SS_CANTSENDMORE . 000000000000 
SS_ISCONFIRMING . 000000000000 
SS_ISCONNECTED . 0000000000 
SS_ISCONNECTING . 000000000000 
SS ISDISCONNECTING . 0200000000 
SS_NOFDREF . O00000000000 
SS_PRIV ° O0O000000000000000 
SS_RCVATMARK N O0O000000000000000000000000 
O 15-6 so state J [] 
15-6 fcntl[] ioct1]|]] 
SS ASYNC[] SS_NBIO | i i 
connect SS_ISCONNECTED 































































































































































































SS_NBIO|| SS_ASYNC 


























1/0 read | 






























































































































































read write 












































































































































| LU U 
SS NBIO[] 0 O volt] | l U U Up HO ET 
EWOULDBLOCK[] 















































































































































































































































SS ASYNC uil 
SIGIO so pgid | Ul 


































































































































































































































































































































































































































































































































































































so pcb 15-7 


































































































so_pcbl] | tcpcbl] 22-1 
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EET 

















[] [] 000 OOOO 
UDP struct inpcb 22.30 
TCP struct inpch 22.30 




















struct tcpch [ 24.5] 




























































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































ICMP[] IGMP[][][] IP | struct inpch 22.3[] 
Od struct rawch 20.30 
0157 DB ODD 
47 so proto Socket (U 7.40 ) protosw[] 
48—64 | SO ACCEPTCONN | | ( 
TCP ) So qO 
TCP ) so q so qO0len[] so_qlen 
So head 
SO ACCEPTCONN 
So qlimit listen 
so qlimit 5 (SOMAXCONN 15-24) 0 15-29 
So qlimit 
15-8 
socket () 













































































































socket () 
sene: 
| sog) > 00000 
| sog |= 
0 TOP SYND D 0 000 0 
000000 accept 00 socket {} 
O000000 
— 
65 so_timeo accept[| connet|[| close (wait channel 15.10 
) 
66 so_error 



















































































































































































































































































































































































































































































































































































































































































67 SS_ASYNC SIGIO ( so_pgid 0) 
( so_pgid 0) ioctl[] SIOCSPGRP[] SIOCGPGRP 
so pgid [Stevens 1992] 
68 so oobmark 16.11 
29.7 TCP 
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69-82 UUDUDUDUDUDUUUDUDU so rev] so snaf 000000000 U U 
so rev[] so sna) DU DH UD D OO D D 0 D 0 D D D D D D D D D D 0 UD 160 
100000000090 
83-86 Net/30 0 0 0 so. tpcb[] so. upcall[] so. upcallarg [| 0 O Net/3[] [] NFS 
NFS] [] [] L] U DU U U U U 000 UD D 0 0 U U U U U 
0 ut IBI so upcall[][][] NFS[] [| 00000 
O OO tsleep[] wakeup|] |] ODO NFS] 0 OOOOOOOO 
Q O socketvar.h[] uipc_socket2.c0 000000000000000 15-9 
U U U U U 0 0 0 U 
o U o U 
sosendallatonce sH D DUDUDU 0 gg 00D 0D 000000000000 
int sosendallatonce (struct socketso); 
soisconnecting IND DO OO OU so rscoNNECTING 
int soisconnecting (struct socket sd); 
soisconnected 000 15-30 
soreadable D8sd0D000000000000 
int soreadable (struct socket sé); 
sowriteable U 0 sol 0000000 D 000 U 
int sowriteable(struct socketso); 
socantsendmore 000000 so_cantsenpMoreg QO OO0000000000000 
int socantsendmore(struct socket so); 
socantrcvmore 000000 so_cAnTRcevmorE] 000000000000000 
int socantrcvmore (struct socketso); 
soisdisconnecting [] I] SS_ISCONNECTING[] U 000 ss ISDISCONG[] SS CANTRCVMORE 














U SS_CANTSENDMOREL D D D O0000000000 


int soisdisconnecting(struct socketso); 





U 





soisdisconnected 


[] [ SS. ISCONNECTING[] SS ISCONNECTED[] SS_ 
U 
O00000000e10seJ 0000 


int soisdisconnected(struct socket sd); 


NO DD ss CANTrCVvMORE[] SS_CANTSENDMORE] 0000000090 


ISDISCONNECTING 








soginsque 


Soqremque 





Net/IN 000000000000 


0004000s00 00 so->so_head] 000000 


int soqremque (struct socketso, int q); 





U sol O head] D DD D DDD D 40 D 00 D D D D DD D D D D 0 D D U 
so 40 000000 DD 000 DD DD DD 000 DD soal 00 0 


int soqinsque (struct socket + head, struct socket + 


so, int q); 








015-9 [000000 
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15.4 0000 









































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































U U U 
Net/3[] 386 
BSD 
386 
syscall syscall 
sysent sysent 
struct sysent 
int sy_narg; /* number of arguments */ 
int (*sy call) (); /* implementing function */ 
y; /* system call table entry */ 
sysent kern/init_sysent.c 
struct sysent sysent[] = { 
Re 
3, recvmsg }, /* 27 = recvmsg */ 
3, sendmsg }, /* 28 = sendmsg */ 
6, recvfrom ), /* 29 = recvfrom */ 
3, accept |, /* 30 = accept */ 
3, getpeername |), /* 31=getpeername */ 
3, getsockname |, /* 32 = getsockname */ 
Pl 
) 
OO recvmsg 270 0 
recvmsg]l] | | 
syscall 
syscall syscall 
386 
struct sysent *callp; 
error = (*callp->sy_call) (p, args, rval); 
callp sysent p 
args 32 bit rval 
32 bit u 
[| syscall 
syscall ([ sy call ) 0 
rval ( ) 
syscall rval 
errno -1 
errnol] |] 0 
386 (carry bit) syscall 
errno -1 
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syscall 
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syscall 








































































































syscall OO dl rvall] ) 











15.4.1 
































socket 





int socket (int domain, int Hype, int protocol); 





































































































socket 











struct socket_args 
int domain; 
int type; 
int protocol; 

i 

socket (struct proc *p, struct socket args *uap, int *retval); 































































































































































































































































































































































































































































































socket syscall 
32bit socket 
socket socket args 15-10 
00000000 


O000000 


å BR ———— ree 


socket_args{} 


[] 15-10 socket DO LJ O 


































































































socket | args 
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*retval[] syscall 0 
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U U 


socket 
bind 





o D 
O00000000 





listen 


accept 


100 
100 





connect 











read 
readv 
recv 
recvfrom 


recvmsg 


U 
O0O000000000000000000 





write 
writev 
send 
sendto 


sendmsg 


O0O000000000000000 





I/O 


select 


= 
I 
© 
Co 





shutdown 


close 








D D D U 











fcntl 

ioctl 
setsockopt 
getsockopt 
getsockname 


getpeername 





Š 


Ë 



































000 
000 



































write 
writev 
sendto 
sendmsg 





Net3Q 0000000 


read 
readv 
readfrom 
readmsg 


select 


0152 00000000 
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15-12 I/O 
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proc{} filedesc() *file{}[] 


























































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































E fd ofiles 
filet) 
socketops: 
EN 
E 
protoswt) DE 
0 15-13 I000000000 
p proc 
proc proc p_fd filedesc 
fd_ofiles file 
file 
15-13 file p->p_fd->fd_ofiles[fd] 
file f_ops[] f£. dart all I/O ([] read 
write) 1/0 f ops fileops 
read[] write[] ioctl[] select[] close 15-13 
f ops fileops Socketops 
f data I/O f data 
Socket Socket So proto protosw 
protosw 
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15.6 socket| | [| [| [] 


socket 


China-pubecom 













































































domain 
































type 














protocol 







































































































































































































































































42 struct socket_args { 


43 
44 
45 
46 ); 


47 socket (p, 


int domain; 
int type; 
int protocol; 


uap, retval) 


48 struct proc *p; 
49 struct socket_args *uap; 


uipc_syscalls.c 
















































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































50 int *retval; 
51 I 
52 struct filedesc *fdp = p-»p fd; 
53 struct socket *so; 
54 struct file *fp; 
55 int fd, error; 
56 if (error = falloc(p, &fp, &fd)) 
57 return (error); 
58 fp->f flag = FREAD | FWRITE; 
59 fp->f type = DTYPE_SOCKET; 
60 fp->f_ops = &socketops; 
61 if (error = socreate (uap->domain, &so, uap->type, uap->protocol)) { 
62 fdp->fd_ofiles[fd] = 0; 
63 ffree(fp); 
64 } else { 
65 fp->f data = (caddr t) so; 
66 *retval = fd; 
67 } 
68 return (error); 
69 } P 
uipc_syscalls.c 
O 15-14 socket [] [] O Ü 
42-55 
socket_args 
proc uap retval 
pl retval uap 
56-60 falloc file fd ofiles ([] 15-13) fp 
fd fd ofiles 
socket|| file fo read soo read 
fileops socketops fo write soo write 
i fo ioctl soo_ioctl 
f ops file socketops fo select | soo select 
15-15 fo close Soo close 
60-69 socreate socket D 15-15 socketops [JO 
socreate | | error file 000 files 00 
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Socreate f data Socket 






















































































































































































*retvall[] fd socket 0 


































































































socreate 




































































15.6.1 socreate 











































































































































































































































































































































































































































































































































































































socket|| socreate 
SOXXX 
NFS 
socreate 15-16 
: uipc_socket.c 
43 socreate(dom, aso, type, proto) 
44 int dom; 
45 struct socket **aso; 
46 int type; 
47 int proto; 
48 ( 
49 struct proc *p = curproc; /* XXX */ 
50 struct protosw *prp; 
51 struct socket *so; 
52 int error; 
53 if (proto) 
54 prp = pffindproto (dom, proto, type); 
55 else 
56 prp = pffindtype (dom, type); 
57 if (prp == 0 || prp-»pr usrreq == 0) 
58 return (EPROTONOSUPPORT) ; 
59 if (prp->pr_type != type) 
60 return (EPROTOTYPE) ; 
61 MALLOC (so, struct socket *, sizeof(*so), M SOCKET, M WAIT); 
62 bzero((caddr t) so, sizeof(*so)); 
63 So-»SO type = type; 
64 if (p-»p ucred-»cr uid -- 0) 
65 SOo-»SO state = SS PRIV; 
66 SO-»SO proto = prp; 
67 error - 
68 (*prp->pr usrreqd) (so, PRU ATTACH, 
69 (struct mbuf *) 0, (struct mbuf *) proto, (struct mbuf *) 0); 
70 if (error) ( 
71 So-»so state |= SS NOFDREF; 
72 sofree (so); 
73 return (error); 
74 ] 
75 *aso = so; 
76 return (0); 
77) 
uipc_socket.c 
0 15-16 socreate [ 0 
43-52 socreate dom ( PF INET)[] aso 
Socket type ( SOCK STREAM)[] proto 
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53-60 proto UU 0 pffindprotol| J] UU [] Ú OD protol]|[] 0] 
pffindtype[]l type U U D 0 U 0 0 0 UD U D D 0 U UD 0 U Ia UU 
U U U D protosw 00000000 GUO 7.60 XL] 

2000000 socket] |] 
61-66 socreatel| [| [| LU UU socket U U U U U U 100 00000 type O O 
U U UD 000 D 00 D DD 0 DD ss PRIVI OO 

3. PRU ATTACH[] 
67-69 UU UU U U U U DD 0 00000000 socreatel) J] 
0000 7.40 | 15-13 so->so proto->pr usrreq Do ID so 







































































































































































00000 U U 0 00 00 U 000000 U U U 




















int pr usrreq(struct socket *so, int req, struct mbuf *mo, xml, *m2); 


U U U U U U 00 0 U UD UD U U U rel U 0 0 0 D UD D D D D «nor 
mi m2) D] U D 0 U D 0 Í mbuf [] D D ODO DO D D D BE 0 0 ] 























































































































































































































































































































a 
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EN U U U 


a 
a 
E 
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[| 15-170 [| 0 pr_usrreq[] 




















































































































PRU_ABORT OOO000000000 
PRU ACCEPT address U D 8 B D D U 

PRU ATTACH protocol 0200000000 
PRU_BIND address 0000000 

PRU CONNECT address 0000000000 
PRU_CONNECT2 socket2 0000000090 
PRU_DETACH D DDD 
PRU_DISCONNECT OOO0000000000 
PRU LISTEN D 0 000000 
PRU_PEERADDR buffer 000000000000 
PRU_RCVD flags O0OO000000 

PRU RCVOOB buffer flags OO OOB[I O 

PRU SEND data address control 000000 
PRU_SENDOOB data address control OO 00B[ O 
PRU_SHUTDOWN 0000000000 
PRU_SOCKADDR buffer 000000000000 





O 15-17 pr usrreg UI 


























PRU CONNECT2J] JO OD Unix) 0 D 0 D 0 D EE 0 D 0 EE EE D EE DT D U 
Unix] I I ere) 000 l U U U U U U (U 
40000 

70-77 [| [| socreatel] | 

















































































































U U UU PRu ATTACHII D LH D 0 U 





U DU D 00000 U 
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| TCP[] UDP 
| 
15.6.2 
15-18 | | 
- (0000 = 
[] [] [] U 000 
OM | 00 
in control N O0O00000000000000 [] 6-14 
in control . 000000 [] 6-22 
in_pcbbind . 0000000 1024 Internet] D [] 22-22 
ifioctl . 000000 [] 4-29 
ifioctl ° OQ0000 (1000000) [] 12-11 
rip_usrreq . 0000 ICMP[] IGMPI OO PO O [] 32-10 
slopen . OOOsSserPO D D D D 000000 |05-9 
0 15-18 Ne/3] 0000000 
LI ioctl1[][] (SIOCADDMULTI SIOCDELMULTI) [| IP ADD 
MEMBERSHIP[] IP DROP MEMBERSHIP [] 0 E 
15-18 “ ” “ ” 
( 
0 15.1)0 [| Neu? suser | L| U 
SS_PRIV] i | 
rip_usrreq| socreate SS_PRIV 




























































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































getsock 
sockargs mbu 
[ LU UU U 
15-19 getsock 0 
754-767 getsock fdp fdes fdp filedesc 
getsock[] [] fpp 0 
15-20 sockargs 
768-783 15-4 sockargs 
| 
0 0 0 [| sockargs 0 
mbu sockargs[] bind 
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mbuf 
754 getsock (fdp, fdes, fpp) uipc_syscalls.c 
755 struct filedesc *fdp; 
756 int fdes; 
757 struct file **fpp; 
758 ( 
759 struct file *£p; 
760 if ((unsigned) fdes >= fdp->fd_nfiles | 
761 (fp = fdp->fd_ofiles[fdes]) == NULL) 
762 return (EBADF); 
763 if (fp->f type != DTYPE SOCKET) 
764 return (ENOTSOCK) ; 
765 *fpp = fp; 
766 return (0); 
767 } 





uipc_syscalls.c 
[] 15-19 getsock [] [] 





uipc_syscalls.c 
768 sockargs (mp, buf, buflen, type) 


769 struct mbuf **mp; 
770 caddr_t buf; 




















































































































































































































































































































































































































































































































































































































771 int buflen, type; 
772 1 
773 struct sockaddr *sa; 
774 struct mbuf *m; 
775 int error; 
776 if ((u_int) buflen > MLEN) ( 
777 return (EINVAL); 
778 } 
779 m = m_get (M_WAIT, type); 
780 if (m == NULL) 
781 return (ENOBUFS); 
782 .m->m_ Jen = buflen; 
783 error = copyin(buf, mtod(m, caddr_t), (u_int) buflen); 
784 if (error) 
785 (void) m_free(m); 
786 else { 
787 *mp = m; 
788 if (type == MT SONAME) { 
789 sa = mtod(m, struct sockaddr *); 
790 sa->sa len = buflen; 
791 ) 
792 ) 
793 return (error); 
794 3 š i 
‘uipc_syscalls.c 
O 15-20 sockargs [] [J 
mbuf mbu sockargs EINVAL[| ENOBUFS 
mbuf mbuf[] copyin 
mbu copyin EACCES 
784-785 mbuf| mp 
mbu sockargs 0 
786-794 type MT_SONAME sockaddr sockargs 
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sa len 





































































































































































































Net/3 pre-4.3BSD Reno 
sockaddr sa_len 15-20 


























































































































































































































15.8 bind] D U 





bind 





















































































































































bind 




























































































































































































(TCP) 




























































































(UDP) bind 


























































































































































































































connect (sendto[] sendmsg) 









































15-21 bind 





















































uipc_syscalls.c 
70 struct bind_args { 


71 int Ss; 

72 caddr_t name; 

73 int namelen; 
74 ); 


75 bind(p, uap, retval) 
76 struct proc *p; 

77 struct bind args *uap; 
78 int *retval; 

79 ( 

80 struct file *fp; 
81 struct mbuf “nam; 
82 int error; 


83 if (error = getsock(p-»p fd, uap-»s, &fp)) 

84 return (error); : 

85 if (error = sockargs(&nam, uap-»name, uap-»namelen, MT SONAME)) 
86 return (error); 

87 error = sobind((struct socket *) fp->f data, nam); 

88 m freem(nam); 

89 return (error); 

90 ) 





uipc syscalls.c 
H 15-21 bina O 








70-82 bind (| bind args JU s name 






















































































































































































( sockaddr in ) namelen 



















































































83-90 getsock file sockargs mbuf sobind 



















































































bind sobind mbu 
































S socket file 


























































































































socket 































































































































































































































































































mbu 
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TCP/IP 2 
mbu mbuf| 
bind retval 15.4 
syscall retval[] 0 0 
retval 
sobind 
15-22 sobind PRU_BIND 

























































































































































































uipc_socket.c 


78 sobind(so, nam) 
79 struct socket *so; 
80 struct mbuf *nam; 











81 I 
82 int s = splnet(); 
83 int error; 
84 error = 
85 (*so->so_proto->pr_usrreq) (so, PRU BIND, 
86 (struct mbuf *) 0, nam, (struct mbuf *) 0); 
87 splx(s); 
88 return (error); 
89 } d 
uipc_socket.c 
U 15-22 sobind [] [] 
78-89 sobind PRU_BIND nam 























































































































































































































15.9 listen] ||] [| 

































































































































































































































































































































































































































































































































































listen | 15-23 
TCP 
accept ([] 15.11[] ) 
91 struct listen_args { HIDE alle 
92 int 8; 
93 int backlog; 
94 ); 
95 listen(p, uap, retval) 
96 struct proc *p; 
97 struct listen args *uap; 
98 int *retval; 
99 ( 
100 struct file *fp; 
101 int error; 
102 if (error = getsock(p-»p fd, uap-»s, &fp)) 
103 return (error); 
104 return (solisten((struct socket *) fp->f data, uap->backlog)); 
105 ) 





uipc_syscalls.c 


0 15-23 listen [1 000 
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91-98 listen 







































































































































































































































































































































































































































































































































































































































































































































































99-105 getsock s|] file solisten 
solisten 
solisten PRU_LISTEN 15-24 
90-109 solisten PRU LISTEN pr usrreg | 
pr usrreq SS ACCEPTCONN 
so qlimit[] Neu? 0 
S(SOMAXCONN) 
- uipc socket.c 
90 solisten(so, backlog) 
91 struct socket *so; 
92 int backlog; 
93 1 
94 int s = splnet(), error; 
95 error = 
96 (*so->so_proto->pr_usrreg) (so, PRU LISTEN, 
97 (struct mbuf *) 0, (struct mbuf *) 0, (struct mbuf *) 0); 
98 if (error) { 
99 splx(s); 
100 return (error); 
101 } 
102 if (so->so_q == 0) 
103 so->so_options |= SO_ACCEPTCONN; 
104 if (backlog < 0) 
105 backlog = 0; 
106 so->so_qlimit = min(backlog, SOMAXCONN) ; 
107 splx(s); 
108 return (0); 
109 } 


uipc_socket.c 


O 15-24 solisten [] Ü 


15.10 tsleep[] wakeup|| | 


























































































































































































































































































































































































































































































































tsleep 
tsleep 
int tsleep(caddr t chan, int pri, char *mesg, int timeo); 
tsleep chan 
wakeup 
wakeup 





































































































void wakeup(caddr t chan); 




































































































































































tsleep 


























































































































tsleep pri | pri 





































































































tsleep pri PCATCH 




































































































































































































































































tsleep mesg tsleep ps 
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timeo 
15-25 tsleep 
wakeup 
tsleep 
tsleep 
tsleep () [] U 

U 00000000 wakeupl O 

EWOULDBLOCK | 00000 meo 0000000000 wakeupl 000000 

ERESTART O000000000000000000000000 

EINTR O000000000000000000000 

H 15-25 tsleep J 000 
wakeup 
[Leffler et al. 1989] 
UDP 
recvfrom tsleep 
wakeup 
tsleep 
TCP 
accept [Comer and Stevens 1993] 
15.11 accept 000 
listen accept accept 
s 
name accept 
TCP ( 
) OSI[] TP4 
tsleep 
15-26 accept 
























































106 
107 
108 
109 
110 


111 
112 
113 
114 


struct accept_args ( 
int s; 
caddr_t name; 
int *anamelen; 
); 


accept (p, uap, retval) 
struct proc *p; 

struct accept_args *uap; 
int *retval; 


D 15-26 accept D U D 


uipc_syscalls.c 
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115 ( 

116 struct file *fp; 

117 struct mbuf *nam; 

118 int namelen, error, s; 

119 struct socket *so; 

120 if (uap-»name && (error - copyin((caddr t) uap-»anamelen, 
121 (caddr t) & namelen, sizeof(namelen)))) 
122 return (error); 

123 if (error - getsock(p-»p fd, uap-»s, &fp)) 

124 return (error); 

125 S = splnet(); 

126 so = (struct socket *) fp->f_data; 

127 if ((so->so_options & SO_ACCEPTCONN) == 0) { 

128 splx(s); 

129 return (EINVAL); 

130 ) 

131 if ((so-»so state & SS NBIO) && so->so_qlen == 0) { 
132 spix(s); 

133 return (EWOULDBLOCK); 

134 } 

135 while (so->so_qlen == 0 && so->so_error == 0) í 
136 if (so->so_state & SS CANTRCVMORE) { 

137 SO-»SO error = ECONNABORTED; 

138 break; 

139 ) 

140 if (error = tsleep((caddr t) & so-»so timeo, PSOCK | PCATCH, 
141 netcon, 0)) ( 

142 splx(s); 

143 return (error); 

144 } 

145 } 

146 if (so->so error) { 

147 error = so->so_error; 

148 so->so_error = 0; 

149 splx(s); 

150 return (error); 

151 ) 

152 if (error = falloc(p, &fp, retval)) { 

153 splx(s); 

154 return (error); 

155 } 

156 { struct socket “aso = so->so_q; 

157 if (sogremque(aso, 1) == 0) 

158 panic ("accept"); 

159 so = aso; 

160 } 

161 fp->f type = DTYPE_SOCKET; 

162 fp->f flag = FREAD | FWRITE; 

163 fp->f ops = &socketops; 

164 fp->f data = (caddr t) so; 

165 nam = m get (M WAIT, MT SONAME) ; 

166 (void) soaccept(so, nam); 

167 if (uap-»name) ( 

168 if (namelen > nam->m len) 

169 namelen = nam->m len; 

170 /* SHOULD COPY OUT A CHAIN HERE */ 

171 if ((error = copyout (mtod (nam, caddr t), (caddr t) uap->name, 
172 (u int) namelen)) == 0) 


U 15-26 (0) 
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173 error = copyout((caddr t) & namelen, 
174 (caddr t) uap->anamelen, sizeof (*uap->anamelen)); 
175 } 
176 m_freem(nam); 
177 splx(s); 
178 return (error); 
179 } 
uipc_syscalls.c 
[] 15-26 (D) 
106-114 accept S name accept 
anamelen 
1. 
116-134 accept] |] (*anamelen) namelen[] getsock file 
( listen) I/O 
EINVAL|| EWOULDBLOCK 
2. 
135-145 while 
(tsleep EINTR)[] accept 
sonewconn 
tsleep tsleep 0 tsleep 
accept EINTR[] EWOULDBLOCK([] 15-25) 
3. 
146-151 accept 
accept 
So error 
| 
so error 
4. 
152-164 falloc Soqremque 
file 15.4 panic 
2 
167-179 accept mbu soaccept 
15.12 
copyout nam|| namelen 
copyout mbu 
accept 
mbu mbu Unix 
( 1023 ) Internet 
16 sockaddr_in 170 
mbuf | 
soaccept 

































































soaccept | | 




































































| | U 15-27 
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uipc_socket.c 
184 soaccept (so, nam) 
185 struct socket *so; 
186 struct mbuf *nam; 
187 ( 
188 int s = splnet(); 
189 int error; 
190 if ((so->so_state & SS_NOFDREF) == 0) 
191 panic ("soaccept: !NOFDREF"); 
192 so->so_state &- ~SS_NOFDREF; 
193 error = (*so->so proto-»pr usrreq) (so, PRU ACCEPT, 
194 (struct mbuf +) 0, nam, (struct mbuf +) 0); 
195 spix(s); 
196 return (error); 
197 ) 
uipc_socket.c 
O 15-27 soaccept [O JJ 
184-197 soaccept PRU_ACCEPT|| || 













































































































































































nam | 























pr_usrreg 





15.12 sonewconn[| soisconnected|] |] 



































EZ 


























































































































so g 





| 15-26 accept 
15-28 TCP 













































































































Å 
4. 







Socket() 


000000 







soisconnected 


sonewconn 





0 D SYND ACK 


D D ACK 
O O 0 TCPSYN TCP] OD D D DD Ack 


O 1528 DD DD D TCPO D 
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A e H 

















































































































































































































































































































































































































































































































































































































































































































































































































15-28 accept tsleep tcp_input 
sonewconn TCP SYN([] 28-7)[] sonewconn 
so q0 
TCP ACK tcp input soisconnected(|] 29-2) 
so q0 SO q accept 
15-26 tsleep accept[] so o 
PRU ATTACH accept 
15-29 sonewconn 





uipc_socket2.c 
123 struct socket * Pr 


124 sonewconn (head, connstatus) 
125 struct socket *head; 
































































































































































































































126 int connstatus; 
127 I 
128 struct socket *so; 
129 int soqueue = connstatus ? 1 : 0; 
130 if (head->so_qlen + head->so q0len > 3 + head-»so qlimit / 2) 
131 return ((struct socket *) 0); 
132 MALLOC(so, struct socket *, sizeof(*so), M SOCKET, M DONTWAIT); 
133 if (so == NULL) 
134 return ((struct socket *) 0); 
135 bzero((caddr t) so, sizeof(*so)); 
136 so->so_type = head-»so type; 
137 So-»So options = head->so options & ^SO ACCEPTCONN; 
138 so->so_linger = head-»so linger; 
139 so->so_state = head->so state | SS NOFDREF; 
140 SOo-»80 proto = head-»so proto; 
141 so->so_timeo = head-»so timeo; 
142 so->so_pgid = head-»so pgid; 
143 (void) soreserve(so, head->so snd.sb hiwat, head->so rcv.sb hiwat); 
144 Soginsque(head, so, soqueue); 
145 if ((*so->so proto->pr usrreq) (so, PRU ATTACH, 
146 (struct mbuf *) 0, (struct mbuf *) 0, (struct mbuf *) 0)) I 
147 (void) soqremque (so, soqueue); 
148 (void) free((caddr t) so, M SOCKET); 
149 return ((struct socket *) 0); 
150 ) 
151 if (connstatus) ( 
152 sorwakeup (head); 
153 wakeup((caddr t) & head->so_timeo); 
154 so->so_state |= connstatus; 
155 } 
156 return (so); 
157 3 
uipc socket2.c 
O 15-29 sonewconn [00 
123-129 head( )[] connstatus( 
) sonewconn TCP connstatus 0 
TP4[] connstatus SS_ISCONFIRMING 
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1. 
130=131 sonewconn 
P 3xso_qlimit 
e a — 
listen(fd, 0 1 18-23 
2. 
132-143 socket 
setsockopt socket so_options 
so lingerl| so_pgid|| sb hiwat socket| 
3. 
144 129 connstatus Soqueue soqueuel] 0 ( 
TCP ) so qO connstatus 0 SO q 
( TP4 ) 
4. 
145-150 PRU_ATTACH 
sonewconn 
5. 
151-157 connstatus 0 accept 
connstatus[]| so state TCP 
TCP connstatus 0 
so go 
soisconnected TCP TCP SYN 
15-30[] soisconnected 
78 soisconnected(so) | Juipc_socket2.c 
79 struct socket *so; 
80 I 
81 struct socket *head = so->so head; 
82 so->so_state &= "(SS ISCONNECTING | SS ISDISCONNECTING | SS ISCONFIRMING); 
83 so->so_state |= SS ISCONNECTED; 
84 if (head && sogremque(so, 0)) ( 
85 soginsque (head, so, 1); 
86 sorwakeup (head); 
87 wakeup((caddr t) & head->so_timeo) ; 
88 } else { 
89 wakeup ( (caddr_t) & so->so_timeo); 
90 sorwakeup (so); 
91 sowwakeup (so) ; 
92 } 
93 ) " 
kern/uipc_socket2.c 
O 15-30 soisconnected {J [J 
6. 
78-87 | soisconnected 
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( accept) head 
soqremque 1 so_q sorwakeup select 
accept 
wakeup tsleep 
7. 

88-93 head Soqremque connect 

head soqremque 0 so_q 
TP4 TP4 
so_q wakeup connect sorwakeup|| sowwakeup 
select 




























































































15.13 connect|| [| LI [] 






































listen|| accept 
































































































































































































































































































































































































































































































































( ) connect 
TCP[] connect 
bind 
UDP[] ICMP[] connect 
15-31 UDP[] TCP connect 


























































































PRU CONNECT 
PRU CONNECT [] [] = D 


TCP] OOO 
O 15-31 connect JO D Ú 
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connect UDP 
soisconnected|| connect 

connect TCP 

soisconnecting 
soconnect tsleep TCP 
soisconnected wakeup 
connect 

15-32 connect 
















































































uipc_syscalls.c 





180 struct connect_args { 


181 int s; 

182 caddr_t name; 
183 int namelen; 
184 ); 


185 connect (p, uap, retval) 
186 struct proc *p; 
187 struct connect_args *uap; 


188 int *retval; 

189 { 

190 struct file *£p; 

191 struct socket *so; 

192 struct mbuf *nam; 

193 int error, s; 

194 if (error = getsock(p-»p fd, uap-»s, &fp)) 

195 return (error); 

196 so = (struct socket *) fp->f data; 

197 if ((so->so state & SS NBIO) && (so-»so state & SS ISCONNECTING)) 
198 return (EALREADY); 

199 if (error - sockargs(&nam, uap-»name, uap-»namelen, MT SONAME)) 
200 return (error); 

201 error - soconnect(so, nam); 

202 if (error) 

203 goto bad; 

204 if ((so-»so state & SS NBIO) && (so-»so state & SS ISCONNECTING)) ( 
205 m freem(nam); | 

206 return (EINPROGRESS); 

207 ) 

208 s = splnet(); 

209 while ((so->so_state & SS ISCONNECTING) && so-»so error == 0) 
210 if (error = tsleep((caddr t) & so-»so timeo, PSOCK | PCATCH, 
211 netcon, 0)) 

212 break; 

213 if (error == 0) ( 

214 error = so->so error; 

215 SO-»SO error = 0; 

216 } 

217 splx(s); 

218 bad: 

219 so->so_state &= ~SS_ISCONNECTING; 

220 m_freem(nam) ; 

221 if (error == ERESTART) 

222 error = EINTR; 

223 return (error); 

224 } 





uipc_syscalls.c 
DH 15-32 comet 0000 
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180-188 connect (| connect args ) s name 
namelen 
189-200 getsock file 
EALREADY sockargs 

1. 
201-208 soconnect soconnect connect 

bad soconnect 1/0 
EINPROGRESS 

connect 
EALREADY soconnect EISCONN 

2. 

208-217 while splnet connect 
tsleep wakeup error OL] tsleep 
218-224 SS_ISCONNECTING 
mbuf| 




























































































15.13.1 soconnect 





















































soconnect 
























































































































































































































































































































































( TCP) UDP 






















































































uipc_socket.c 
198 soconnect (so, nam) 


199 struct socket *so; 
200 struct mbuf *nam; 


201 I 

202 int S; 

203 int error; 

204 if (so->so options £ SO_ACCEPTCONN) 

205 return (EOPNOTSUPP); 

206 S - splnet(); 

207 qe 

208 * If protocol is connection-based, can only connect once. 
209 * Otherwise, if connected, try to disconnect first. 

210 * This allows user to disconnect by connecting to, e.g., 
211 * a null address. 

212 */ 

213 if (so->so_state £ (SS_ISCONNECTED | SS_ISCONNECTING) && 
214 ((so->so_proto->pr_flags & PR_CONNREQUIRED) || 

215 (error = sodisconnect (so)))) 

216 error = EISCONN; 

217 else 

218 error = (*so-»so proto-»pr usrreqd) (so, PRU CONNECT, 
219 (struct mbuf *) 0, nam, (struct mbuf *) 0); 
220 splx(s); 

221 return (error); 

222 } 





uipc_socket.c 
O 15-33 soconnect T JJ 
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15-33 soconnect 
198-222 soconnect EOPNOTSUPP 
listen | 
EISCONN 

sodisconnect 

PRU CONNECT 
15132 

connect name 
0 sodisconnect 
PRU_CONNECT EAFNOSUPPORT 

EADDRNOTAVAIL 






























































































































































































































































































































































15.14 shutdown [| J Ú 


shutdown 15-34 








shutdown shutdown 































































































































































































































































































































































































shutdown TCP 



























































FIN TCP ( 1 18.5] ) 

























































































close shutdown 













































































































































































close close 



























































































































































550 
551 
552 
553 


554 
555 
556 
557 
558 
559 
560 


561 
562 
563 
564 


uipc_syscalls.c 


struct shutdown_args { 
int s; 
int how; 

m 


shutdown(p, uap, retval) 
struct proc *p; 
struct shutdown args *uap; 
int *retval; 
{ 

struct file *fp; 

int error; 


if (error = getsock (p->p_fd, uap->s, &fp)) 
return (error); 
return (soshutdown((struct socket +) fp->f data, uap->how)); 
} 


— ————OnP  "-*7 — vV[Sx—-ulipc_suscalls.c 


0 15-34 shutdown [] OOO 














































































































550-557 shutdown_args si [| how | 15- 


35 













































































how[] how++( 15-36 ) | | 



































376 






































China-bubcom 






















































































































































































































































































































































































































































































































































































































































































TCP/IP 2 
how how++ O O 
0 FREAD 00000000 
FWRITE 00000000 
2 FREAD|FWRITE | 000000000 
[] 15-35 shutdown 000000 
how FREAD|| FWRITE 
558-564 shutdown soshutdown (wrapper function) getsock 
soshutdown 
soshutdown| | sorflush 
sorflush 
PRU_SHUTDOWN soshutdown 15-36 
uipc_socket.c 


720 soshutdown (so, how) 
721 struct socket *so; 





















































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































722 int how; 

723 I 

724 struct protosw *pr = so->so_proto; 

725 howrt; 

726 if (how & FREAD) 

727 sorflush(so); 

728 if (how & FWRITE) 

729 return ((*pr->pr usrreq) (so, PRU, SHUTDOWN, 

730 (struct mbuf *) 0, (struct mbuf *) 0, (struct mbuf *) 0)); 

731 return (0); 

732 ] ` 

uipc_socket.c 
O 15-36 soshutdom [] J] 

720-732 sorflush 

( 15-37 ) PRU_SHUTDOWN 
733-747 SB_NOINTR 
sblock splimp 

socantrcvmore sockbuf asb 
splx asb bzero sockbuf 
mbuf 

748-751 shutdown 

| sockbuf sb_mb mbu 

| [| dom dispose 
Unix 
dom_dispose 
Unix 
[Stevens 1990][] [Leffler et al. 1989] 
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uipc_socket.c 
733 sorflush (so) 


734 struct socket *so; 




























































































































































































































































































































































































































































































































































































































































































































































































































































































735 I 
736 struct sockbuf *sb = &so-»so rcv; 
737 struct protosw *pr = so->so_proto; 
738 int S; 
739 struct sockbuf asb; 
740 sb->sb flags |= SB NOINTR; 
741 (void) sblock(sb, M WAITOK); 
742 S = splimp(); 
743 socantrcvmore (so); 
744 sbunlock (sb) ; 
745 asb = *sb; 
746 bzero((caddr_t) sb, sizeof(*sb)); 
747 Spix(s); 
748 if (pr-»pr flags & PR RIGHTS && pr-»pr domain->dom dispose) 
749 (*pr-»pr domain-»dom dispose) (asb.sb mb); 
750 sbrelease (&asb) ; 
751 T . 
uipc_socket.c 
[| 15-37 sorflush Jj] [| 
sbrelease mbuf shutdown 
(O E] 15.6) 
PRU_SHUTDOWN TCP PRU_SHUTDOWN 
FIN TCP 
15.15 closel] [| [| Li 
close fd 
close 
error = (*fp->f_ops->fo_close) (fp,p); 
15-13 fp->f£_ops->fo_closel] soo close 
15.15.1 soo close 
soo close soclose 15-38 
sys socket.c 
152 soo close(fp, p) 
153 struct file *fp; 
154 struct proc *p; 
155 { 
156 int error = 0; 
157 ‚if (fp->f data) 
158 error = soclose((struct socket *) fp->f data); 
159 fp->f data = 0; 
160 return (error); 
E d sys socket.c 





O 15-38 soo close 00 
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152-161 socket file soclose f data 

























































































15.15.2 soclose 




































































































































































































































































































































































soclose ( ) 
soclose 15-39 

130 struct socket *so; 

131 I 

132 int s = splnet(); /* conservative */ 

133 int error = 0; ` 

134 if (so->so options & SO_ACCEPTCONN) { 

135 while (so-»so, q0) 

136 (void) soabort (so->so_q0); 

137 while (so->so_q) 

138 (void) soabort (so->so_q); 

139 } 

140 if (so->so_pcb == 0) 

141 goto discard; 

142 if (so->so_state & SS_ISCONNECTED) { 

143 if ((so->so_state & SS_ISDISCONNECTING) == 0) { 

144 error = sodisconnect (so); 

145 if (error) 

146 goto drop; 

147 } 

148 if (so->so_options & SO_LINGER) { 

149 if ((so->so_state & SS_ISDISCONNECTING) && 

150 (so->so state & SS_NBIO)) 

151 ‘goto drop; 

152 while (so->so_state & SS_ISCONNECTED) 

153 if (error = tsleep((caddr_t) & so->so_timeo, 
154 PSOCK | PCATCH, netcls, so->so_linger) ) 
155 break; 

156 } 

157 } 

158 drop: 

159 if (so->so_pcb) { 

160 int . error2 = 

161 (*so->so_proto->pr_usrreg) (so, PRU_DETACH, : 
162 (struct mbuf *) 0, (struct mbuf *) 0, (struct mbuf *) 0); 
163 if (error -- 0) 

164 error - error2; 

165 } 

166 discard: 

167 if (so->so_state & SS NOFDREF) 

168 panic("soclose: NOFDREF"); 

169 so->so_state |= SS_NOFDREF; 

170 sofree (so); 

171 splx(s); 

172 return (error); 

173 } 





uipc_socket.c 


[] 15-39 soclose [ 0 








China=pupecom R 379 



























































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































1. 
129-141 soclose soabort 
soclose discard 
soabort PRU_ABORT 
soabort[] [] 23-38 30-7[] UDP[] TCP PRU_ABORTI] 
2. 
142-157 drop 
sodisconnect 
SO_LINGER soclose 
soclose drop 
SO_LINGER soclose 
while (so_linger) 
oL tsleep[] ( ) 
3. 
158-173 PRU DETACH 
sofree 
sofree 15-40 






























































uipc, socket.c ' 
110 sofree(so) 


111 struct socket *so; 



















































































































































































































































































































































































































































































112 ( : 
113 if (so-»so pcb || (so->so state & SS NOFDREF) == 0) 
114 return; 
115 if (so-»so head) ( 
116 if (!sogremque (so, 0) && !soqremque(so, 1)) 
117 panic("sofree dq"); 
118 So-»so head - 0; 
119 } 
120 sbrelease (&so->so_snd); 
121 sorflush (so); 
122 FREE (so, M_SOCKET); 
123 } : 
uipc_socket.c 
[] 15-40 sofree [] [] 
4. 
110-114 sofree 
5. 
115-119 (so head ) 
panic so_head 
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2 
120-123 sorelease[|[]HTU0UU | sorflush | | tl U 
l U U i 
1918. TID 
pr_usrreq[] 
Internet 0 
U U 
15.1 7 
15.2 0 accept[] sockaddrl|] [| 0 
? 
15.3 IPv6 [| accept[] recvfroml[] 128 bit[] IPv6[]  [] 
ogu 0 mbu 
accept[] recvfrom mbu 
[] mbu EN mbu mbuf[] [] 
? 
15.4 15-26 soqremque panic? 
15.5 sorflush ? 
15.6 [| sorflush]|] |] 0 20 0 
LU 16 LU 

























































































Dik dek 


U 160 


U l 


I/O 












































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































16.1 [| [| 
OOO000000000| l U U I U U D U 0 0 (U 
nnnnn D) [] write[] writev[] sendto[] sendmsg[] 
read|| readv|| recvfrom|| recvmsg 
ID select select | | (| ) 
uuu 0 sosend[] soreceivel] |] 0 0 
0 vo] [] Ü O O0 U U 0 
O UU Vo] 
16.2 0000 
016100000 C 
00 0 [] 
sys/socket.h D D APOOOOOOOD 
sys/socketvar.h socket] 00000 
sys/uio.h uio JO Ú 
kern/uipc_syscalls.c socket[] [] 
kern/uipc_socket.c DU U D D 
kern/sys_generic.c select] 0 Ú Ú 
kern/sys socket.c select 020000 
U 161 JIOOGO0000 G D D 
620 U U U U U U U 0 U UD D U UU select U U DD U U U i OU 
U U (000 U [] 
selwait int select 000000 
nselcoll int OM select 0200000000 
sb max u long | I00000000000000 
U 16-2 00000000 
163 0000 
D 15.30 | 0 0 i OOO U U U D 0 
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TCP/IP 2 
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sockbuf 16-3 sockbuf ( 15-5) 
socketvar.h 

72 struct sockbuf { 

73 u long sb cc; /* actual chars in buffer */ 

74 u long sb hiwat; /* max actual char count */ 

75 u long sb mbcnt; /* chars of mbufs used */ 

76 u long sb mbmax; /* max chars of mbufs to use */ 

77 long sb lowat; /* low water mark */ 

78 struct mbuf *sb_mb; /* the mbuf chain */ 

79 struct selinfo sb sel; /* process selecting read/write */ 

80 short sb flags; /* Figure 16.5 */ 

81 short sb timeo; /* timeout for read/write */ 

82 ) so rcv, so snd; 

socketvar.h 
O 16-3 sockbuf [] [] 
72-78 mbu sb mb mbuf 
mbuf[] sb. cc | mbu sb hiwat[] sb lowat 
sb mbcnt | mbu | | 
mbuf 0-2048 ( 
sb_mbmax mbu socket 
PRU_ATTACH 262,144 
16-4 Internet! 






















































































0 16-4 Internet] 00000000000 























































































































































































































UDP UDP sb_hiwat 
40[] IK sockaddr_in ( 16 ) 
79 sb_sel select selinfo (16.13[] ) 
80 16-5 sb_flags 
sb-flags U O 
SB_LOCK U DD 00 DD 000 D 0 U 
SB WANT O00000000000000 
SB WAIT U U U U U 0 U 0 U 0 U 0 U 0 U 00 0 U 0 U U 
SB SEL U D D 0 0 DU00000000 U 
SB ASYNC 42000000 vop O 
SB_NOINTR U U U U U 0 U 0 L 
SB NOTIFY (SB WAIT|SB AEL|SB ASYNC) 
OOO000000000000000000000000 wakeuel D D D Ú 













































































































































































































































































O 16-5 sb flags J JJ 
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81-82 sb timeol DU D D 0 D 0 0 0 0 D 0 0 D D D 0 D D D D D D D D D U (tick 
U U 0 0 00 0 D 0 0 000 DU UU SO_SNDTIMEOL so RGVYTTMEOÙ D D U D 0 D 


[| sb timeo[l [] [] 

























































































U DU D D 0 000 00 D 00 D 0 0 D 0 0 D 0 D 1660000000000000 









































U [] Oo O 
sblock U D D sbD D D D 0 wi 0 mwarrok0 00000000000000000000 
00000000 EwouLpBLockD D D D D DD DDD DOD DDD ErNTRI 
ERESTART 00000 

int sblock (struct sockbuf *sb, iwf); 
sbunlock OOO0s0000000000s000000000 
void sbunlock (struct sockbufsby U 
sbwait OO tsieepf D ss D 0000000 tsieepl D D 0 0 
int sbwait (struct sockbufsh [] 
NDODODODDDODDDDDDDDDDDOND sbwait D U D D sø] UD tsleepl] 
OG 
void sowakeup (struct socketsb, struct sockbufsb[] 
sorwakeup D DDD sp D DDD DDD DD DDD D 0 roppo000000 00000000 
D sıcıo] 0 











sowakeup 














void sorwakeup (struct socket sh [] 


sowwakeup O000s00000000000000000 UO DDD 00 DDD DDD 0 D 0 0 
D sIGIO 0 


void sowwakeup (struct sockets) U 


0166 DDDUUDDUUDDUDDUD 






















































































































































































































































































11674 0000000090 000000000000 U U U U U 00 U 
m|] m0|] n|] control mbuf sb 
o 0 o D 
sbspace sog D D DDD «emu»: 
min(sb_hiwat - sb cc), (sb_mbmax - sb_mbcont) 
long sbspace (struct sockbufsby[] 
sballoc [] ml] B. set] 00000 sb O sv. << sb mbent 
void sballoc(struct sockbufsh, struct mbuf n [] 
sbfree Osho OO m] OO U 0 so I sb. <el) sb. mbent 
int sbfree(struct sockbufsh, struct mbuf m0 
sbappend 0 m[] O mbuff [] so 000 
int sbappend(struct sockbufsb” struct mbufmj]l] 
sbappendrecord [] mU) 00000 sen ü ü B Ul sbcompress 
int sbappendrecord(struct sockbufs& struct mbuf m0)[] 
0167 OO0000000000000000 
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0 H o d 


sbappendaddr asa 000000 mbufl] 0000 control] mol 0000 mbufl] 0000 

DU set) D D D 

int abappendaddr (struct 3b, struct sockaddrasa, 

struct mbuf m0, struct mbuf control) [|] 

sbappendcontrol O control] mo) DO D] O mbuf 000000050000 

int abappendcontrol(struct sb, struct mbufm®, 
struct mbuf control) [] 

O0s0000000000 

struct sockbufsb, struct mbuf m)[] 

00000 

struct sockbufsh, struct mbuf ms 
struct mbuf øm» 











sbinsertoob m000000 


i 


la] 


t abinsertoob 





( 
sbcompress TT m DD au H 0 
( 


void abcompress 















































sbdrop O O so O len O O 
void sbdrop(struct sockbufs int len) U 

sbdroprecord D D so OO000000000000000000 
void sbdroprecord(struct sockbufsb3[] 

sbrelease O O soflusal] O so D] O O mbuti [| O sb. hiwat[] sb mbmax[] 0 
void sbrelease(struct sockbuf sb) |] 

sbflush O D] s5000 0 mbuf 
void sbflush(struct sockbutfsb5[] 

soreserve 000000000000 (high-water and low-water máhfk) 
00000000 sbreserve 0000 sndee] 00000000 
sbreservel] 0 000 revecd 00000000000 sb_iowatQ 0000 
DU D (D 164000000000 0000 ENopurs 





int soreserve(struct socketso, int sndcc, int rcvcc)[] 


sbreserve 0s000000000c00000000000c0 000000000 


int sbreserve(struct sockbufs%& int cc)[] 























U 16-7 (17) 


16.4 write[] writev[| sendto[] sendmsg[] || O [| 
















































































































































































































































































































































































O O O write writev[] sendtol] senansg] LH U D D U WO WW 000000000 
OOOOOOO0000000000000000 sendamssD D D D D U D U DI UE D 0 U 
sosend[] sosenal] [| | uut 
000000000 U U DU 00 00 DUD DU 0 16-80 00 sosend 00000 
U U D U U 0 DD 0 0 D 0 U U 16-83 DU U U D U 0 D 0 U U UD U D 0 0 U 
soo write 0000000090 
016210000000 00000000 (sena) J J Ú 
O Net/3] O0 send I] 000000 senatod I U (U U U (1 (1 U) U (U U) U 
U U U D 00 D 00 UU sendi) I Ul lll esenall O U U DU U D D U 
U D 16-90 O00 U OO writel] writevl] popo0000000000 
OOOOOOOOO U 

















































































































O O pr usrred] DD 
PRU SEND PRU SENDOOB 


D 168 000000000 sesen 0 0 



















































































































































































































































































































































































































































































































































































U U U DDD D U D ODO U D D 0 l 0? |0000? 
U D D 0 
write U D D 1 
writev 0000 [1..UIO MAXIOV] 
send od 1 . 
sendto DO 1 . . 
sendmsg DD [1..UIO-MAXIOV] . . . 
0169 90000 
16-9 writev[] sendmsg 
(gathering) 
(scattering) iovec 
| UIO MAXIOV 16-10 iovec 
uio.h 
41 struct iovec ( 
42 char *iov base; /* Base address */ 
43 Size t iov len; /* Length */ 
44 y; = 
uio.h 


[] 16-10 iovec [] [] 






































41-44 16-10 iov base iov len 
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China-pub.tom 





























iovec 
















































































































































































writev 






































































































































16-11 





























iovec 

















iovent 






























































iovp 


writev 


























































































































iovp 











iovcnt-1 


Niovent-1 





i ovent-1 bytes 


















































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































016-11 writev 00000 iove 00 
write|| writev|| send 
connect 
sendto|| sendmsg 
connect 
16-9 send xxx 16-12 
flags [] U O O 
MSG_DONTROUTE 00000000000 [] 16-23 
MSG DONTWAIT 000000000000 O 16-22 
MSG EOR OOOOOOOOOOO 16-25 
MSG OOB H H H H [] 16-26 
[] 16-12 send xxx[] 0 0 OD O flags J 
16-9 sendmsg 
msghdr([] 16-13) sendmsg 
socket.h 
228 struct msghdr { 
229 caddr_t msg_name; /* optional address */ 
230 u int msg namelen; /* size of address */ 
231 struct iovec *msg_iov; /* scatter/gather array */ 
232 u_int msg_iovlen; /* # elements in msg_iov */ 
233 caddr_t msg control; /* ancillary data, see below */ 
234 u_int msg_controllen; /* ancillary data buffer len */ 
235 int msg_flags; /* Figure 16.33 */ 
236 }; 
socket.h 
O 16-13 msghdr DI 
msg name sockaddr 
228-236 msghdr (msg. name[] msg. namelen) / 
(msg iov[] msg. iovlen) (msg control[]|] msg controllen) 

































































Chi asul COM 16 vo 387 


















































































































































(msg_flags) cmsghdr 16-14 
251 struct cmsghdr { socket} 
252 u_int cmsg_len; /* data byte count, including hår */ 
253 int cmsg level; /* originating protocol */ 
254 int cmsg type; /* protocol-specific type */ 
255 /* followed by u_char cmsg_data[]; */ 
256 }; 
socket.h 





O 16-14 emsghar [] [] 








































































































251-256 cmsg_type 

























































































































































































cmsg_len 






























































16-15 sendmsg[] msghdr 


#————msg_namelen —— o, oÑaÑ 

































































msghdr() 












M0 8 g_controllen—əj  . s  [ ə ll 
O 16-15 sendmsg ] O 0 OU msghar [| [| 


16.5 sendmsg | [ [| [| 















































































































































































































































































































































































































































































































































































































































































































































sendmsg API sendmsg 
sendit sosend sosend 
SOCK_DGRAM SOCK_STREAM 
SOCK SEQPACKET ( 
) ( ) SOCK PDM 
( ) 
sosend SOCK SEQPACKET|| SOCK_PDK 
Internet 
16-16 sendmsg 
307-319 sendmsg msghdr 










































































































































































































































































copyin[| nsghdr 











3 88 TCP/IP 2 












































307 struct sendmsg_args { 


308 
309 
310 
311 }; 


int S; 
caddr t msg; 
int flags; 


312 sendmsg(p, uap, retval) 
313 struct proc *p; 
314 struct sendmsg args *uap; 


315 int 


316 ( 
317 


*retval; 


struct msghdr msg; 
































China-pub.tom 


uipc_syscalls.c 


uipc_syscalls.c 




































































































































































































































































































































































































































































































































































318 struct iovec aiov[UIO SMALLIOV], *iov; 
319 int error; 
320 if (error = copyin(uap->msg, (caddr t) € msg, sizeof (msg))) 
321 return (error); i 
322 if ((u_int) msg.msg_iovlen >= UIO_SMALLIOV) { 
323 if ((u int) msg.msg_iovlen >= UIO_MAXIOV) 
324 return (EMSGSIZE); 
325 MALLOC (iov, struct iovec +, 
326 sizeof (struct iovec) + (u int) msg.msg_iovlen, M_IOV, 
327 M_WAITOK) ; 
328 ) else 
329 iov = aiov; 
330 if (msg.msg_iovlen && 
331 (error = copyin((caddr t) msg.msg iov, (caddr_t) iov, 
332 (unsigned) (msg.msg iovlen + sizeof(struct iovec))))) 
333 goto done; 
334 msg.msg iov = lov; 
335 error = sendit(p, uap->s, &msg, uap->flags, retval); 
336 done: 
337 if (iov != aiov) 
338 FREE (iov, M_IOV); 
339 return (error); 
340 } 
O 16-16 sendmsg [1 [] O O 
1. iov 
320-334 8 (UIO SMALLIOV)[] iovec 
sendmsg MALLOC 
1024(UIO_MAXIOV) EMSGSIZE[| copyin|| iovec 
malloc 
8 



































2. sendit[] cleanup 















































































































































































































































































































































































































































335-340 sendit sendmsg 
iovec ( ), sendit 
16.6 sendit|] [| 
sendit sendtol| sendmsg sendit uio 
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sosend uiomove 
























































uio 

















16.6.1 uiomove[l |] 


















































uiomove 





int uiomove(caddr t cp, int n, struct uio *uio); 

































































































































































































































































































































































































































































































































































































































































































































































































































































uiomove cp uio iovec 
n 16-7 uio uiomove 
- uio.h 
45 enum uio rw L 
46 UIO READ, UIO WRITE 
47 Y; 
48 enum uio_seg { /* Segment flag values */ 
49 UIO_USERSPACE, /* £rom user data space */ 
50 UIO_SYSSPACE, /* from system space */ 
51 UIO USERISPACE /* from user instruction space */ 
52 ); 
53 struct uio ( 
54 struct iovec *uio_iov; /* an array of iovec structures */ 
55 int uio iovent; /* size of iovec array */ j 
56 off t uio offset; /* starting position of transfer */ 
57 int uio resid; /* remaining bytes to transfer */ 
58 enum uio, seg uio segflg; /* location of buffers */ 
59 enum uio rw uio rw; /* direction of transfer */ 
60 struct proc *uio, procp; /* the associated process */ 
61 }; ji 
uio.h 
O 16-17 wol Ú 
45-61 uio | uio iov|f| iovec | uio offset|| 
uiomove IUU uio resid uiomove 
uio offset n, uio resild[|n uiomove uio iov 
uio iov uio iov uio segflg 
uio iov uio rw 































































































































































































16-18[] uiomove 
































































































































uiomove 














uio segflg uio rw O O 





UIO_USERSPACE UIO-READ 020000 cp 00-00000000 
UIO USERISPACE 


UIO USERSPACE UIO-WRITE 0020000000 -00000000 ee 

UIO USERISPACE 
UIO SYSSPACE UIO-READ U D D H D cp U H n 0000000000 

UIO-WRITE | D D 0000000000000000 e0 









































O 16-18 uiomove [] [] 


390 


16.6.2 























TCP/IP 












































16-19 





















































uio 






uio_iovent 
uio_offset 









































uiomove uio 





China-pubecom 


—— uio_resid — 






O 16-19 [] [| uiomove [] O wol] 























































































































































































































































































































































































































































































































ulo_iov iovec iov base 
uio offset ol] uio resid 
cp mbuf| 16-20 
uiomove uio 
uiomove(cp, n, uio); 
ke——uio offset — —PJ— — uio resid — 
ll À. Le S hr KAA ss asa 
DO 
. ulo() iov_len iov_base 
uio 7 7 
uio_iov 
uio_iovent |2 not"n-n 
uio offset |n no 


LBS. 


uio resid 
uio segflg 
uio rw 

uio, procp 


(ng T H T Ha) H 
UIO_USERSPACE 
UIO_WRITE 


AAA Poo 


}*———uio_offset——» 

















O 16-20 [] [| uiomove [] [| wo] O 

































































































































































ny&n&ngtn,) 










































































































































































































































































































































































uiomove 0 uio iov 
iovec 
uio offset n|| uio resid n 
uio rw UIO WRITE. 
















































































































































































































































































































































































































































































































































































































































































































































































































































































16.6.3 sendit 
sendit 16-21 
1. auio 
341-368 sendit getsock file uio 
for 
uio resid if if 
uio_resid uio_resid iov_len 
2. 
369-385 ‚|| sockargs 
- : uipc_syscalls.c 
341 sendit(p, s, mp, flags, retsize) 
342 struct proc *p; 
343 int s; 
344 struct msghdr *mp; 
345 int flags, *retsize; 
346 ( 
347 struct file *fp; 
348 struct uio auio; 
349 struct iovec *iov; 
350 int i; 
351 struct mbuf *to, *control; 
352 int len, error; 
353 if (error = getsock(p->p_fd, s, &fp)) 
354 return (error); 
355 auio.uio_iov = mp->msg_iov; 
356 auio.uio_iovent = mp->msg_iovlen; 
357 auio.uio segflg = UIO_USERSPACE; 
358 auio.uio rw = UIO WRITE: 
359 auio.uio procp = p; 
360 auio.uio offset = 0; /* XXX */ 
361 auio.uio_resid = 0; 
362 iov = mp->msg_iov; 
363 for (i = 0; i < mp->msg iovlen; i++, iov++) { 
364 if (iov->iov len < 0) 
365 return (EINVAL); 
366 if ((auio.uio_resid += iov->iov_len) < 0) 
367 return (EINVAL); 
368 } : 
369 if (mp->msg name) ( 
370 if (error - sockargs(&to, mp-»msg name, mp-»msg namelen, 
371 MT SONAME)) 


O 16-21 sendit [] [J 


392 
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372 return (error); 
373 } else 
374 to = 0; 
375 if (mp->msg_control) { 
376 if (mp->msg controllen < sizeof (struct cmsghdr) 
377 ) I 
378 error = EINVAL; 
379 goto bad; 
380 } 
381 if (error = sockargs(&control, mp->msg control, 
382 mp->msg_controllen, MT CONTROL) ) 
383 goto bad; 
384 ) else 
385 control = 0; 
386 len = auio.uio_resid; 
387 if (error = sosend((struct socket *) fp->f data, to, &auio, 
388 (struct mbuf *) 0, control, flags)) ( 
389 if (auio.uio resid != len && (error == ERESTART || 
390 error == EINTR || error == EWOULDBLOCK) ) 
` 391 error = 0; 
392 if (error == EPIPE) 
393 psignal(p, SIGPIPE); 
394 ) 
395 if (error == 0) 
396 *retsize = len - auio.uio resid; 
397 bad: 
398 if (to) 
399 m freem(to); 
400 return (error); 
401 } 
uipc syscalls.c 
O 16-21 (O) 
3. 
386-401 sosend uio_resid 
len uio sosend 
sosend sendit 
. sosend 
° sosend EPIPE SIGPIPE error 0 
PIPE 
S ( ) *retsize 
sendit o[] syscall(|] 15.4] ) *retsize 
. 
sendit sosend control 




































































































































































16.7 sosend{] [] 


sosend 16-8 


























SOS 
































































































































































































































































































































end| | sosend 











16 vo 393 















































































































































pr_usrreq 























sosend 





































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































sosend sb_hiwat|| sb_lowat 
16.7.1 Oooo HH 
sb_cc Oz sb ccz sb hiwat 
sb. cc sb hiwat 
sosend pr_usrreg 
sosend 
° PR_ATOMIC|| sosend 
sosend 
mbu pr usrreq RDP[] SPP 
° PR ATOMIC[] sosend mbu 
mbuf SOCK STREAM TCP 
SOCK SEQPACKET TP4 TP4 MSG EOR ( 
16-12) sosend 
TCP TCP TCP 
4096 
2048 mbuf] TCP 
2048 
sosend 
sb_lowat TCP sb_lowat 
2048 ([] 16-4) TCP 
16.7.2 
([] UDP) 
sb_cc O[] sb hiwat 
16-4 UDP sb hiwat 9216(9x 1024) 
SO SNDBUF sb hiwat 9216 
1 11.10 
TCP/IP 
NFS 9216 NFS 
8192 






































394 





TCP/IP 2 


























China-bubcom 














16-22 













































































sosend 

























































































uipc_socket.c 

































































































































































































































































































































271 sosend (so, addr, uio, top, control, flags) 
272 struct socket *so; 
273 struct mbuf *addr; 
274 struct uio *uio; 
275 struct mbuf *top; 
276 struct mbuf *control; 
277 int flags; 
278 { 
305 restart: 
306 if (error = sblock (&so->so_snd, SBLOCKWAIT(flags))) 
307 goto out; 
308 do { /* main loop, until resid == 0 */ 
342 do { 
343 if (uio == NULL) { 
344 JE 
345 * Data is prepackaged in "top". 
346 */ 
347 resid = 0; 
348 if (flags & MSG_EOR) 
349 top->m_flags |= M_EOR; 
350 } else 
351 do { 
396 } while (space > 0 && atomic); 
412 } while (resid && space > 0); 
413 } while (resid); 
414 release: 
415 sbunlock (&so->so_snd) ; 
416 out: 
417 if (top) 
418 m freem(top); 
419 if (control) 
420 m freem(control); 
421 return (error); 
422 ) 
uipc socket.c 
O 16-22 sosend [] (] [0 Ü 
271-278 sosend so addr 
uio VO uio top mbuf 
control mbu flags 
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uio top 
(O NFS) mbu sosend[] top mbuf| uio 
279-304 U U U 
1. 
305-308 sosend restart sblock 
flagsl| MSG DONTWAIT SBLOCKWAIT M_NOWAIT 
M_NOWAIT sblock EWOULDBLOCK 
MSG_DONTWAIT Net/3 NFS 
| (O resid=0) 
2. 
309-341 sosend 
sosend 
restart 
3 top 
342-350 sosend | | 
uio | ( top] [| [| mbu ) sosend MSG_EOR 
M_EOR mbu 
4. 
351-396 uio sosend PR ATOMIC ( 
UDP) mbu sosend 
break([] 16-22 break) sosend 
5. 
395-414 PR_ATOMIC | E resid 0 
release PR ATOMIC 
sosend mbuf| 
sosend mbu 
6. 
414-422 mbu 
sosend 
N (U 16-23) 
° ([] 16-24) 
° ([] 16-25) 
° (O 16-26) 
sosend 16-23 
7. Ú 
279-284 sosendallatonce[][] true([] PR ATOMIC[I] JO DO EB OT 























































































































396 TCP/IP 2 China-pubecom 
e 





































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































top mbu sosend atomic mbuf 
mbu 
285-297 resid iovec top mbu 
16.1 resid 
uipc_socket.c 
279 struct proc *p = curproc; /* XXX */ 
280 struct mbuf **mp; 
281 struct mbuf *m; 
282 long space, len, resid; 
283 int clen = 0, error, s, dontroute, mlen; 
284 int atomic = sosendallatonce (so) || top; 
285 if (uio) 
286 resid = uio-»uio resid: 
287 else 
288 resid = top-»m pkthdr.len; 
289 /* 
290 * In theory resid should be unsigned. 
291 * However, space must be signed, as it might be less than 0 
292 * if we over-committed, and we must use a signed comparison 
293 * of space and resid. On the other hand, a negative resid 
294 * causes us to loop sending 0-length segments to the protocol. 
295 */ 
296 if (resid « 0) 
297 return (EINVAL); 
298 dontroute - 
299 (flags & MSG DONTROUTE) && (so-»so options & SO DONTROUTE) 22 0 && 
300 (so-»so proto-»pr flags & PR ATOMIC); 
301 p-»p stats-»p ru.ru msgsnd++; 
302 if (control) 
303 clen - control-»m len; 
304 #define snderr (errno) { error = errno; splx(s); goto release; ) _ 
: uipc_socket.c 
O 16-23 sosend [IN Ú] Ú] Ü 
8. 
298-303 dontroute 
clen 
304 snderr out 
16-24 sosend 
309 
sosend 
310-311 * ( TCP ) EPIPE 
312-313 * ( ICMP 
) so_error sendit 
([] 16-21 389 ) 
314-318 * ENOTCONN 
sosend 
Internet TP4 































































































































































































Chinaspubecom mm tw 397 















































































































































































































































































































































319-321 ® ( send 
connect ) EDESTADDREO 
uipc_socket.c 
309 s = splnet(); 
310 if (so->so_state & SS_CANTSENDMORE) 
311 snderr (EPIPE); 
312 if (so->so_error) 
313 snderr (so->so_error); 
314 if ((so->so_state & SS_ISCONNECTED) == 0) { 
315 if (so->so_proto->pr_flags & PR_CONNREQUIRED) { 
316 if ((so->so_state & SS_ISCONFIRMING) == 0 && 
317 l (resid == 0 && clen != 0)) 
318 snderr (ENOTCONN) ; 
319 } else if (addr == 0) 
320 snderr (EDESTADDRREQ) ; 
321 } 
322 space = sbspace(&so-»so, snd) : 
323 if (flags & MSG OOB) 
324 Space += 1024; 
325 if (atomic && resid » so-»so snd.sb hiwat || 
326 clen » so-»so snd.sb hiwat) 
327 snderr (EMSGSIZE); 
328 if (space < resid + clen && uio && 
329 (atomic || space < so->so_snd.sb_lowat || space < clen)) { 
330 if (so->so_state & SS_NBIO) 
331 snderr (EWOULDBLOCK) ; 
332 sbunlock (&so->so_snd) ; 
333 error = sbwait (&so->so_snd); 
334 splx(s); 
335 if (error) 
336 goto out; 
337 goto restart; 
338 } 
339 splx(s); 
340 mp = &top; 
341 space -= clen; 


uipc_socket.c 


O 16-24 sosend U 0 0 0 0 0 D 0 UD 






















































































322-324 sbspace 




























































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































sb_mbmax 
mbuf[] [| (O 16-6)[] sosend 1024 
10. 
325=327 atomic (high-watermark) 
EMSGSIZE 
EMSGSIZE 
11. ? 
328-329 ( top) 
sosend 













































































































































































398 TCP/IP 2 China-pub.com 
se 




























































































































































































































































































































































































































































































































































































































































































° (atomic ) 
top sosend ( uio ) mbuf 
sosend 
[Crowcroft et al. 1992] 













































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































12. 
330=338 sosend EWOULDBLOCK 
sosend sbwait sbwait 
sosend restart 
sbwait SO_SNDTIMEO 
sb_timeo EWOULDBLOCK 
16-21 sendit 
mbuf 
339-341 sosend splx 
sosend mp 
mbuf sosend 
(clen) 
16-25 sosend mbuf 
13. mbuf 
351-360 atomic 
mbuf atomic 
top 
14. 
361-371 space 
MCLBYTES MCLGET mbuf| Space MCLBYTES 
2048 resid MCLBYTES 
MCLGET sosend nopages mbu 
MINCLSIZE > 2 208(MINCLSIZE) 
mbu 
atomic ( UDP) mbu 
max hdr 
atomic ( TCP) sosend 
space (2048 ) len len 
( 16-2) 






























































China-bubco «usw 399 





























































































































































































































































































































































































































































































































uipc socket.c 
351 do ( 
352 if (top == 0) { 
353 MGETHDR (m, M WAIT, MT DATA); 
354 mlen = MHLEN; 
355 m-»m pkthdr.len = 0; 
356 m->m_pkthdr.rcvif = (struct ifnet +) 0; 
357 } else { 
358 MGET (m, M WAIT, MT DATA); 
359 mlen = MLEN; 
360 } 
361 if (resid >= MINCLSIZE && space >= MCLBYTES) { 
362 MCLGET (m, M_WAIT); 
363 if ((m-»m flags & M EXT) == 0) 
364 goto nopages; 
365 mlen = MCLBYTES; 
366 if (atomic && top == 0) { 
367 len = min(MCLBYTES - max hår, resid); 
368 m->m data += max hdr; 
369 } else 
370 len = min(MCLBYTES, resid); 
371 space -= MCLBYTES; 
372 } else { 
373 nopages: 
374 len = min(min(mlen, resid), space); 
375 space -= len; 
376 LE i 
377 * For datagram protocols, leave room 
378 * for protocol headers in first mbuf. 
379 */ 
380 if (atomic && top == 0 && len < mlen) 
381 MH ALIGN(m, len); 
382 } 
383 error = uiomove(mtod(m, caddr t), (int) len, uio); 
384 resid = uio->uio resid; 
385 m->m len = len; 
386 *mp = m; 
387 top->m_pkthdr.len += len; 
388 if (error) 
389 goto release; 
390 mp = &m->m next; 
391 if (resid <= 0) ( 
392 if (flags & MSG EOR) 
393 top->m flags |= M EOR; 
394 break; 
395 } 
396 } while (space > 0 && atomic); 
uipc_socket.c 
[] 16-25 sosend [] H1 D] HU D] U 
15. mbuf 
372-382 mbuf (1) 
mbu (2) (3) 
atomic MH ALIGN 
mbuf| MH ALIGN 
mbuf| atomic 




















































































































































































































400 TCP/IP 2 

























































































China-pubecom 





















































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































16. 
383-395 uiomove len mbuf| mbu 
mbu mbuf([] top mbuf) mbu 
sosend release 
MSG_EOR M_EOR 
sosend 
MSG_EOR OSI TP4[] TCP 
MSG_EOR 
17. ? 
396 atomic[| sosend mbuf] 
space>0 atomic space 
mbu atomic 
16-2 
sosend mbuf 16-26 
uipc_socket.c 
397 if (dontroute) 
398 so->so_options |= SO_DONTROUTE; 
399 s = splnet(); /* XXX */ 
400 error = (*so->so_proto->pr_usrreq) (so, 
401 (flags & MSG OOB) ? PRU_SENDOOB : PRU SEND, 
402 top, addr, control); 
403 splx(s); 
404 if (dontroute) 
405 so->so options &= ^SO DONTROUTE; 
406 clen = 0; 
407 control = 0; 
408 top = 0; 
409 mp = &top; 
410 if (error) 
411 goto release; 
412 } while (resid && space > 0); 
413 } while (resid); i 
uipc socket.c 
O 16-26 sosend [I 0000 
397-405 SO_DONTROUTE 
16-23 
MSG_DONTROUTE 
pr usrreq pr usrreq splnet 
splx (OU UDP) 
sosend PRU SENDOOB 
PRU. SEND] | mbu 
406-413 clen[| controll] top|] mp 
mbu atomic (U TCP)[] resid 








































































































































































































16 
































































































































I/O 


401 
































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































0 sosend 
mbuf] sosend ([] 16-24) 
230 0 UDP 0 26[] 0 
| I O TCP 
16.7.3 sosend{] | ] 
sosend | 142 3 goto 
PR ATOMIC 
NFS MSG DONTWAIT mbuf] 
SS ISCONFIRMING MSG EOR OSI 
u | | H sosend[] | pr. send 
protosw [Partridge and Pink 1993] 
16.7.4 E 
16-25 sosend mbu 
mbuf 
[Jacobson 1998a] 
mbuf(204 ) CPU 
mbuf mbuf 
[Jacobson 1998a] 2096 
([] 1 20.7 
) [ | [] TCP 0 20 E 
20 TCP 
16.8 read|] readv[] recv£rom[] recvmsg|| || [| [] 
read|| readv|| recvfrom|| recvmsg 
recvmsg recvmsg 
16-27 (recv) 
[] U (0000 DUDU NDOODDOOODOD?ID uU? 000000? 
read D UO D C 1 
readv Hogg [1..UIO MAXIOV] 
recv O O 1 . 
recvfrom OO 1 . 
recvmsg OO [1..UIO-MAXIOV] . . . 
U 16-27 020000 
Net/3 recv recvfrom 





































































































































































































402 iu China"pub.tom 
trutt l 

























































































































































































































































































































































































































































































































































































recv orecv 
recvfrom 
read|| readv 
iovec recvfrom 
recvmsg getpeername 
16.11 
soreceive 16-28 












































































































































































































































Soo read 


OD pr usrreg] 00 PRU_RCVD B : 


[] PRU. RCVOOB 


O 16-28 000000 0 soreceive DO 

















16-28 





































































































































































































16.9 recvmsg| [| [| [] 



























































































































































recvmsg 









































































































































































































































16-29 recvmsg 







































































































































































433-445 recvmsg msghdr 



























































1. iov 


















































































































































446-461 sendmsg recvmsgl| msghdr 




















China-bubco em un” 403 









































































































































aiov iovec iov 


(U 16.4[] ) msghdr 



























































































































































uipc syscalls.c 
433 struct recvmsg args ( 


434 int S; 

435 struct msghdr “msg; 
436 int flags; 

437 1; 


438 recvmsg(p, uap, retval) 
439 struct proc *p; 
440 struct recvmsg_args *uap; 


441 int *retval; 

442 { 

443 struct msghdr msg; 

444 struct iovec aiov[UIO_SMALLIOV], *uiov, *iov; 

445 int error; 

446 if (error = copyin((caddr t) uap->msg, (caddr t) & msg, sizeof(msg))) 
447 return (error); 

448 if ((u int) msg.msg iovlen >= UIO SMALLIOV) 4 

449 if ((u int) msg.msg iovlen >= UIO MAXIOV) 

450 return (EMSGSIZE); 

451 MALLOC(iov, struct iovec *, 

452 sizeof(struct iovec) * (u int) msg.msg iovlen, M IOV, 

453 M WAITOK); 

454 ) else 

455 iov - aiov; 

456 msg.msg flags - uap-»flags; 

457 uiov = msg.msg iov; 

458 msg.msg iov - iov; 

459 if (error - copyin((caddr t) uiov, (caddr t) iov, 

460 (unsigned) (msg.msg iovlen * sizeof(struct iovec)))) 
461 goto done; 

462 if ((error = recvit(p, uap->s, &msg, (caddr t) 0, retval)) == 0) { 
463 msg.msg_iov = uiov; 

464 error = copyout((caddr t) & msg, (caddr_t) uap-»msg, sizeof(msg)); 
465 } 

466 done: 

467 if (iov != aiov) 

468 FREE (iov, M_IOV); 

469 return (error); 

470 } 





uipc_syscalls.c 


[ 16-29 recvmsg 0 000 





2. recvit 


































































































































































































462-470 recvit msghdr 





































































































iovec 

































































16.10 recvit[| |] 






























































































































































































































































recvit recv[] recvfrom|] recvmsg 16-30 recv xxx 
msghdr recvit soreceive uio 
471-500 getsock s file recvit uio 
iovec msg iovlen 









































































































































































































































404 rem 03 Lmzchuktnh 
trutt pg) 















































uio resid len 






























































—— uipc_syscalls.c 





471 recvit(p, s, mp, namelenp, retsize) 
472 struct proc *p; 

473 int s; 

474 struct msghdr *mp; 

475 caddr_t namelenp; 




































































































































































476 int *retsize; 
477 1 
478 struct file *fp; 
479 struct uio auio; 
480 struct iovec *iov; 
481 int 1; 
482 int len, error; 
483 struct mbuf “from = 0, *control = 0; 
484 if (error = getsock (p->p_fd, s, &fp)) 
485 return (error); 
486 auio.uio_iov = mp->msg_iov; 
487 auio.uio_iovent = mp->msg_iovlen; 
488 auio.uio segflg = UIO USERSPACE; 
489 auio.uio rw = UIO READ; 
490 auio.uio procp = p; 
491 auio.uio offset = 0; /* XXX */ 
492 auio.uio resid = 0; 
493 iov = mp->msg iov; 
494 for (i = 0; i < mp-»msg iovlen; i++, iov++) { 
495 if (iov->iov len < 0) 
496 return (EINVAL); 
497 if ((auio.uio resid += iov->iov len) < 0) 
498 return (EINVAL); 
499 } 
500 len = auio.uio_resid; 
uipc_syscalls.c 
[] 16-30 recvit [| [ DO OD uie [] LU 
recvit soreceive 16-31 
uipc_syscalls.c 
501 if (error = soreceive((struct socket *) fp->f_data, &from, &auio, 
502 (struct mbuf **) 0, mp->msg control ? &control : (struct mbuf **) 0, 
503. &mp-»msg flags)) { 
504 if (auio.uio resid !- len && (error -- ERESTART || 
505 error -- EINTR || error -- EWOULDBLOCK)) 
506 error - 0; 
507 T 
508 if (error) 
509 goto out; 
510 *retsize = len - auio.uio_resid; 
511 if (mp->msg name) { 
512 len = mp->msg_namelen; 
513 if (len <= 0 || from == 0) 
514 len = 0; 
515 else { 
516 if (len > from->m len) 
517 len = from->m len; 
518 /* else if len < from->m len ??? */ 
519 if (error = copyout (mtod(from, caddr_t), 


DH 16-31 recvit [900000 





Chinaspubscom «un 405 
























































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































520 (caddr_t) mp->msg_name, (unsigned) len)) 
521 goto out; 
522 } 
523 mp->msg_namelen = len; 
524 if (namelenp && 
525 (error = copyout((caddr t) & len, namelenp, sizeof(int)))) { 
526 goto out; 
527 } 
528 } 
529 if (mp->msg control) { 
530 len = mp->msg_controllen; 
531 if (len <= 0 || control == 0) 
532 len = 0; 
533 else { 
534 if (len >= control->m_len) 
535 len = control->m_len; 
536 else 
537 mp->msg_flags |= MSG_CTRUNC; 
538 error = copyout ((caddr_t) mtod(control, caddr_t), 
539 (caddr t) mp->msg control, (unsigned) len); 
540 } : 
541 mp->msg_controllen = len; 
542 } 
543 out: 
544 if (from) 
545 m freem (from) ; 
546 if (control) 
547 m freem(control); 
548 return (error); 
549 3 . 
uipc. syscalls.c 
O 16-31 (0) 
1. soreceive 
501-510 soreceive 
*retsize 
(Zen[] | uio resid) 
WA 
511-542 recvit 
soreceive 
namelenp (| sockaddr ) 
msg_flags MSG_CTRUNC 16-7 
3. 
543-549 out mbu 





























































































































16.11 soreceive|] |] 





























































































































soreceive 











































































































































































































































































































































































































406 ama 0: Chinaspubecom 
— TT «$< Tum 
























































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































16-32 soreceive 
flags U 0 [] U 
MSG DONTWAIT 020000000090 [] 16-38 
MSG OOB O0000000000000 [] 16-39 
MSG PEEK O000000000000 [] 16-43 
MSG WAITALL 000000000000 [] 16-50 
O 16-32 rev LH BH B] H B. B]. | | B. D] DUU 
recvmsg 
16-33 msghdr[] recvmsg Ü] 
msg flags L ü U [] 
Msc CTRUNC | 0000000000000000 
MSG_EOR O000000000000000 
MSG OOB 00000000 
MSG TRUNC O0000000000000000 
U 16-33 recmsg O TO 0 Ú D 0 0 Ú D msg flag |] 
161171 | EL 
(OOB) 
OOB OOB 
OOB OOB UDP 
OOB TCP OOB TCP 
sendxxx MSG_OOB OOB sosend 
OOB 
recvxxx MSG OOB OOB 
SO OOBINLINE ( 17.30 0000 OOB 
SO_OOBINLINE OOB 
MSG_OOB OOB 
OOB recvmsg 
MSG_OOB OOB 
OOB 
OOB SIOCATMARKioct]] 
OOB 
| LU L u 
OOB 
16.11.2 





























16-34 A-I 





















































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































U D 0000 
O 16-34 O00000 
A-I MSG_OOB J 
9 (A-D 9 
I SIOCATMARK J 
SIOCATMARK A-I J-L 
16-34 J TCP 
K 29.7 
16.11.3 
MSG_PEEK 
MSG_PEEK 
MSG_WAITALL soreceive 
MSG_WAITALL soreceive 
NFS[] Net/3 MSG_WAITALL| | MSG_DONTWAIT 
ioctl|| fentl 1/0 MSG DONTWAIT 
16.11.4 







































































































































































mbu 









































































































































408 TCP/IP G 20 








China-pub.com 














































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































[| m_nextpkt 0 000000 mburi O dq] 2-2D0000000000000000000 
U U U U 00000000000 UU | U U U U 

JO PR. ATOMICII IO O LE] L] uut uut 0000000000 
0000000000 TCP 0200000090 00000 
U U PR_ATOMICH UUUUUUUUUUULD LU LU U U U 
UDPI] U U U U U U U U U OOOO 

PR_ADDR[] 10000 0 sbappendaddr]] O [| [| mburi O 0000 

U U U LU LU U D U U mbuff] OG | | O mbuf[] 0 U U U U 
OOO mbufli 

O [| sock SEQPACKET[] SOCK_RDML IU ID D] L] DÚ 0000 mbuf] (T ODO 
PR_ATOMIC U sbappendrecord I II DU D| LU EL EL U U LÍ 
PR ATOMIC[][ OOO (OSIO TPAO O O sbappendrecord] [I [| 0200009090 
O I] spappenal] D H U O 

O00 PR ATOMIC DD TP4 

PR ATOMIC U M EOR [III D HE EIL UD E] U 

U 1635000000 mbuf 000000 MUU UDP DU D D D D U D D D] 0 mbufl] 
OOOm type] UU 

OU O 16-350 U U UD 0 0 D D 0 D D UD UD UDP D 0 0 D D D 0 D 0 D 0 U 
U U D 0 DU U U 22-50 D] 23-70 
















































































sb lowat [ [| | 









































16.115 HÆR 












































0 16-35 QOOO0000 UDPD D B B 
U U PR ATomN D H B. D] 0 HL sb_lowat D U D U U PR_ATOMIC[] [] 
OOOOO00000000000000000 16-410 D] O 
B Hmgmpiuttb 
0200000000 (0 sock STREAM O D D TOP D ODO sbappendl O O O 


UU 
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00000000 mburi) D 0 D 0 D 0 D 0 0 D 0 0 0 D 0 D 0 D 0 D 0 0 0 0 U 
U U UU sp 10wat U D U D D U 0 0 D 0 U D 0 0 D U 0 0 D D 0 U 
U 16-36] D 0000000000 TCPD 0000000 
socket (1 

















































































































O 16-36 TCPO so xcv OQ 





16.11.6 [] HHH I 

















ug TCP] IDD DUDDDDDUUUDDUUDUDUDLDD sbappendcontro1] [ODDO 
U U U 0 U mbuf | UU 000000 OOB 
sbinsertoob| | [| 0000 mbuf 070000 OOBU UU mbuf [1 D] E] D] E] U E] U HE D Ú 
U U U mbu D D 0 0 D D D 0 0 D D 00 0 0 D 0 U 0 0 0 0 0 0 


O0 1630040000000 O0B 0000000000 
socket () 














































































































































































































[L1 
























































D 16-37 OO0O0000000Bp[ DU sore D D 











Unix 0000000000 OSITP40 000 MT_OOBDATA mbuf[] TCPO 
OOOOOOO mt.cobsbata 000000000 TC 0 000000000000 
0 (s0_00BINLINEJ O0 00000000000000 008000 TCPO 00000 
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410 regn 0 China"pub.tom 
tren ytt l 


29.7 























































































































16.12 soreceivel] |] 














soreceive soreceive 


(U 16-32) 














































































































































































































































































































soreceive 16-38 






























































































































































soreceive 











uipc_socket.c 


439 soreceive(so, paddr, uio, mp0, controlp, flagsp) 
440 struct socket *so; 

441 struct mbuf **paddr; 

442 struct uio *uio; 

443 struct mbuf **mp0; 

444 struct mbuf **controlp; 

445 int *flagsp; 


446 ( 

447 struct mbuf *m, **mp; 

448 int flags, len, error, s, offset; 
449 struct protosw *pr = so->so proto; 
450 struct mbuf *nextrecord; 

451 int moff, type; 

452 int orig resid = uio->uio_resid; 
453 mp = mp0; 

454 if (paddr) 

455 *paddr = 0; 

456 if (controlp) 

457 *controlp = 0; 

458 if (flagsp) 

459 - flags - *flagsp & ^MSG EOR; 

460 eise 

461 flags - 0; 





pis: 7 AN 
483 restart: 


484 if (error = sblock(&so->so rcv, SBLOCKWAIT (flags))) 
485 return (error); 

486 S - splnet(); 

487 m = so->so rcv.sb mb; 





542 dontblock: 


543 if (uio->uio procp) 
544 uio->uio procp->p stats->p ru.ru msgrev++; 
545 nextrecord = m-»m nextpkt; 





591 


U 16-38 soreceive 000090 





China=pubecom aos 411 





































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































592 if ((flags & MSG_PEEK) == 0) 

593 m-»m nextpkt = nextrecord; 

594 type = m->m_type; 

595 if (type == MT_OOBDATA) 

596 flags |= MSG_OOB; 

597 } 

693 } /* while more data and more space to fill */ 
























































































































































































































































































































































































































































































































































































































































































































































715 release: 











































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































716 sbunlock(&so-»so rcv); 
717 splx(s); 
718 return (error); 
Pa uipc socket.c 
U 16-38 (0) 
439-446 soreceive so mbu 
*paddr mp0 mbuf soreceive 
*mp0 mbu uio uio resid 
mp0 soreceive uio *controlp 
mbu soreceive 16-33 *flagsp 
447-453 soreceive pr uio resid( 
) orig_resid orig_resid 
0 uio_resid orig_resid 
uio, resid[] soreceive ([] 16-51) 
454-461 *paddr[] *controlp MSG EOR 0 
soreceive[] *flagsp flagsl] ( 16.8)]] flagsp 
recvmsg flagsp flags[] 0 
483-487 sblock flags 
MSG_DONTWAIT soreceive 
NFS 
soreceive m 
mbu mbu 
1; 
488-541 soreceive 
soreceive restart 






































































































































542-545 soreceive 



































































































































































































































































































































dontblock mbu nextrecord 
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2. 
542-545 
3. 
591-597 OOB soreceive 
soreceive 
4. 
598-692 mbuf (m ) (uio_resid>0) 
693-719 
16-39 soreceive[] OOB 
- uipc_socket.c 
462 if (flags & MSG_OOB) { 
463 m = m get (M WAIT, MT DATA); 
464 error = (*pr-»pr usrreq) (so, PRU_RCVOOB, 
465 m, (struct mbuf *) (flags & MSG PEEK), (struct mbuf *) 0); 
466 if (error) 
467 goto bad; 
468 do { i 
469 error = uiomove(mtod(m, caddr t), 
470 (int) min(uio->uio resid, m->m_len), uio); 
471 m = m free (m) ; 
472 ) while (uio->uio resid && error == 0 && m); 
473 bad: 
474 if (m) 
475 m freem(m) ; 
476 return (error); 
477 } š 
uipc socket.c 
0 16-39 soreceive 7 QU 010000 
5. OOB 
462-477 OOB soreceive mbu 
PRU_RCVOOB while uio 
soreceive 0 
PRU RCVOOB UDP EOPNOTSUPP TCP 
30.2 16-40 soreceive 
478 TE (mp) uipc_socket.c 
479 *mp = (struct mbuf *) 0; 
480 if (so->so_state & SS_ISCONFIRMING && uio->uio_resid) 
481 (*pr-»pr usrreq) (so, PRU RCVD, (struct mbuf *) 0, 
482 (struct mbuf *) 0, (struct mbuf *) 0); 
uipc_socket.c 
O 16-40 soreceive (000000 
6. 
478-482 mbuf *mp 
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SO ISCONFIRMING PRU RCVD 
SO ISCONFIRMING OSI TP4 TP4 
getpeername shutdown|| close 
16-38 16-41 soreceive 
uipc_socket.c 
488 /* 
489 * If we have less data than requested, block awaiting more 
490 * (subject to any timeout) if: 
491 * 1. the current count is less than the low water mark, or 
492 * 2. MSG WAITALL is set, and it is possible to do the entire 
493 * receive operation at once if we block (resid «- hiwat). 
494 * 3. MSG DONTWAIT is not set 
495 k 
496 * If MSG_WAITALL is set but resid is larger than the receive buffer, 
497 * we have to do the receive in sections, and thus risk returning 
498 * a short count if a timeout or signal occurs after we start. 
499 XI 
500 if (m == Il ((flags € MSG_DONTWAIT) == 0 && 
501 so->so_rcv.sb_cc < uio->uio resid) && 
502 (so-»so rcv.sb cc < so-»so rcv.sb lowat | | 
503 ((flags & MSG WAITALL) && uio->uio resid <= so-»so rcv.sb hiwat)) && 
504 m-»m nextpkt == 0 && (pr->pr flags & PR ATOMIC) == 0) : 
uipc socket.c 
O 16-41 soreceive [| [ 00000? 
7. ? 
488—504 soreceive 
. (m 0) 
° (sb_cc<uio_resid) 
MSG DONTWAIT (sb cc<sb lowat) 
(m_nextpkt 0 PR_ATOMIC) 
. 
MSG_WAITALL soreceive 
(uio resid=sb hiwat)[] soreceive 
MSG DONTWAIT sorecevie 
16-42 soreceive 
8. ? 
505-534 soreceive 
505-512 ° (m ) soreceive 

























































































































































































414 
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TCP/IP 2 
(m ) 
MSG_PEEK MSG_PEEK 
513-518 * sosend 
OT dontblock ) soreceive 
release 0 
519-523 soreceive 
dontblock 
524-528 ENOTCONN 
release 
529-534 0 release 0 
EWOULDBLOCK( ) 
: uipc_socket.c 
505 if (so->so_error) { 
506 if (m) 
507 goto dontblock; 
508 error = S0->80 error; 
509 if ((flags & MSG PEEK) == 0) 
510 So-»80 error = 0; 
511 goto release; 
512 ) 
513 if (so-»so state & SS CANTRCVMORE) { 
514 if (m) 
515 goto dontblock; 
516 eise 
517 goto release; 
518 } 
519 for (; m; m = m->m_next) 
520 if (m->m_type == MT_OOBDATA || (m->m_flags & M_EOR)) { 
521 m = so->so_rcv.sb_mb; 
522 goto dontblock; 
523 } 
524 if ((so->so_state & (SS ISCONNECTED | SS ISCONNECTING)) == 0 && 
525 (so->so_proto->pr_flags & PR CONNREQUIRED)) { 
526 error = ENOTCONN; 
527 goto release; 
528 ) 
529 if (uio->uio_resid == 0) 
530 goto release; 
531 if ((so-»so state € SS NBIO) || (flags & MSG DONTWAIT)) { 
532 error = EWOULDBLOCK; ` š 
533 goto release; 
534 ) 
535 Sbunlock(&so-»so rcv); 
536 error - sbwait(&so-»so rcv); 
537 splx(s); 
538 if (error) 
539 return (error); 
540 goto restart; 
541 






































































































































































































































































































































uipc_socket.c 


U 16-42. soreceive (0000000000? 
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9. 
535-541 soreceive ( 
| sbwait sbwait 
soreceive soreceive restart 
sosend SO RCVTIMEO sbwait 
sbwait EWOULDBLOCK 
sb timeo 
soreceive 16-43 
uipc_socket.c 
542 dontblock: 
543 if (uio->uio procp) 
544 uio->uio procp->p stats-»p ru.ru msgrcv++; 
545 nextrecord = m->m nextpkt; i 
546 if (pr->pr flags & PR ADDR) { 
547 orig resid = 0; 
548 if (flags & MSG PEEK) { 
549 if (paddr) 
550 *paddr = m_copy (m, 0, m->m len); 
551 m = m->m next; 
552 } else { 
553 sbfree(&so->so rcv, m); 
554 if (paddr) ( 
555- *paddr = m; 
556 so->so_rcv.sb_mb = m->m_next; 
557 m->m_next = 0; i 
558 m = so->so_rcv.sb_mb; 
559 } else { 
560 MFREE (m, so-»so rcv.sb mb); 
561 m = so-»80 rcv.sb mb; 
562 } 
563 } 
564 } 


10. dontblock 


uipc_socket.c 


DH 16-43 soreceive 0000000090 


















































































































































































































































































































































































































































































































































































































































542-545 nextrecord soreceive 
mbuf 
11. 
546-564 UDP mbu mbu 
*paddr paddr | 
soreceive MSG_PEEK 
16-44 mbu 
12. 
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565-590 mbu ( MSG PEEK 
) *controlp controlp 
S uipc socket.c 
565 while (m && m->m type == MT CONTROL && error == 0) { 
566 if (flags & MSG PEEK) { 
567 if (controlp) 
568 *controlp = m_copy (m, 0, m->m len); 
569 m = m->m next; 
570 ) else { 
571 sbfree(&so->so rcv, m); 
572 if (controlp) { 
573 if (pr-»pr domain-»dom externalize && 
574 mtod(m, struct cmsghdr *)->cmsg type == 
575 SCM RIGHTS) 
576 error - (*pr-»pr domain-»dom, externalize) (m); 
577 *controlp = m; 
578 so->so_rcv.sb_mb = m->m_next; 
579 m->m_next = 0; 
580 m = so->so_rcv.sb_mb; 
581 } else { 
582 MFREE (m, so-»so rcv.sb mb); 
583 m - so-»so rcv.sb mb; 
584 } 
585 } 
586 if (controlp) { 
587 orig_resid = 0; 
588 controlp = &(*controlp)->m. next; 
589 } 
590 } I 
uipc socket.c 


[] 16-44 soreceive 020000009090 










































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































dom_externalize 
mbu SCM_RIGHTS( ) dom_externalize 
Unix 7.3 
(controlp ) mbu 
mbu 
Unix dom_externalize 
mbuf m mbuf 
mbuf m 0 
16-45 soreceive mbuf 
591 if (m) ( uipc_socket.c 
592 if ((flags & MSG PEEK) == 0) 
593 m->m_nextpkt = nextrecord; 
594 type = m->m_type; 
595 if (type == MT OOBDATA) 
596 flags |= MSG OOB; 
597 } 


TITT TIA e MIDC. socket.c 


O 16-45 soreceive U 000 0 0 O mbuf 
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13. 
591-597 mbu mbuf mbu 
m soreceive while m 
mbuf[] (next record) m mbuf type 
mbu OOB flags MSG_OOB TCP 
MT_OOBDATA MSG_OOB TCP 
16-47 mbu 16-46 
0 E [] U 
moff D MSS_PEEKDDDDDODDDDODDDDOODDODND 
offset [] Msc. PEEK D D D D OOBI] 000000 
uio_resid 0000000 
len DO mbuff] D DDD DD UU UU | uio resid] 0000 00BJO000000 len 
0000 mieng 
U 16-46 soreceive [| DH 0 0 U 
uipc_socket.c 
598 moff = 0; 
599 offset = 0; 
600 while (m && uio->uio resid > 0 && error == 0) { 
601 if (m->m_type == MT_OOBDATA) { 
602 if (type != MT_OOBDATA) 
603 break; 
604 } else if (type == MT_OOBDATA) 
605 break; 
606 so->so_state &= “SS_RCVATMARK; 
607 len = uio->uio_resid; 
608 if (so->so_oobmark && len > so->so_oobmark - offset) 
609 len = so->so_oobmark - offset; 
610 if (len > m-»m len - moff) 
611 len = m->m len - moff; 
612 /* 
613 * If mp is set, just pass back the mbufs. 
614 * Otherwise copy them out via the uio, then free. 
615 * Sockbuf must be consistent here (points to current mbuf, 
616 * it points to next record) when we drop priority; 
617 * we must note any additions to the sockbuf when we 
618 * block interrupts again. 
619 */ 
620 if (mp == 0) { 
621 splx(s); 
622 error = uiomove(mtod(m, caddr t) + moff, (int) len, uio); 
623 s = splnet(); 
624 } else 
625 uio->uio_resid -= len; . 
uipc_socket.c 
[] 16-47 soreceive [] [| [| uiomove 
598-600 while mbu uio 
mbuf 
14. OOB 
600-605 mbu mbu 
TCP 
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15. OOB 
606-611 oobmark oobmark 
mbuf 
TCP 
612-625 uio uiomove mbu 
uio resid 
uiomove 
uiomove 
16-48 mbu 
- uipc_socket.c 
626 if (len == m->m_len - moff) { 
627 if (m->m flags & M_EOR) 
628 flags |= MSG EOR; 
629 if (flags & MSG PEEK) { 
630 m = m->m next; 
631 moff = 0; 
632 } else { 
633 nextrecord = m->m_nextpkt; 
634 sbfree(&so->so rcv, m); 
635 if (mp) { 
636 *mp = M; 
637 mp = &m->m_next; 
638 s0->s0 rcv.sb mb = m = m->m next; 
639 *mp = (struct mbuf *) 0; 
640 } else { 
641 MFREE (m, so->so rcv.sb mb); 
642 m = so->so_rcv.sb_mb; 
643 } 
644 if (m) 
645 m->m_nextpkt = nextrecord; 
646 } 
647 } else { 
648 if (flags & MSG PEEK) 
649 moff += len; 
650 else ( 
651 if (mp) 
652 *mp = m copym(m, 0, len, M WAIT); 
653 m->m data += len; 
654 m->m len -= len; 
655 so->so_rcv.sb_cc -= len; 
656 } 
657 } . 
uipc_socket.c 
U 16-48 soreceive 0000000 
16. mbu 
626-646 mbuf mbuf 
mbuf MSG_EOR MSG_PEEK 
so_receive MSG_PEEK 
uiomove mbu 
mp 
16-49 OOB MSG EOR 
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658 if (so->so_oobmark) { uipc_socket.c 
659 if ((flags & MSG PEEK) == 0) { 

660 so->so_oobmark -= len; 

661 if (so->so_oobmark == 0) { 

662 so->so_state |= SS_RCVATMARK; 
663 break; 

664 } 

665 } else { 

666 offset += len; 

667 if (offset == so->so_oobmark) 

668 break; 

669 } 

670 } 

671 if (flags & MSG_EOR) 

672 break; 





uipc_socket.c 


U 16-49 soreceive 2000000090 










































































































































































































































































































































































































































































































































































































































































































































































17. OOB 
658-670 0 

SS_RCVATMARK soreceive while MSG_PEEK 
offset so_oobmark 

18. 

671-672 soreceive mbu 
16-50 MSG_WAITALL 
uipc_socket.c 

673 /* 
674 * If the MSG_WAITALL flag is set (for non-atomic socket), 
675 * we must not quit until "uio->uio_resid == 0" or an error 
676 * termination. If a signal/timeout occurs, return 
677 * with a short count but without error. 
678 * Keep sockbuf locked against other readers. 
679 */ 
680 while (flags & MSG WAITALL && m == 0 && uio->uio resid > 0 && 
681 !sosendallatonce(so) && !nextrecord) { 
682 if (so->so error || so->so_state & SS_CANTRCVMORE) 
683 break; 
684 error = sbwait(&so-»so rcv): 
685 if (error) ( 
686 Sbunlock(&so-»só rcv); 
687 splx(s); 
688 return (0); 
689 } 
690 if (m = so->so_rcv.sb_mb) 
691 nextrecord = m->m_nextpkt; 
692 } 
693 } /* while more data and more space to fill */ 


uipc_socket.c 


O 16-50 soreceive [] [| [| MSG WAITALL UI 


19. MSG_WAITALL 


420 





TCP/IP 












































673-681 














sosendalla 


MSG_WAITALL 


China-pub.com 














































































































0) 


(m 


























tonce 




























































































(nextrecord ) 
































soreceive 
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soreceive 
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690-692 

















m 








0 





























while 























23. 








mbuf 








nextrecord 





























sbwait 


























(error 

















sbwait 














nextrecord 
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693 





mbu 





























600[] ( 












































16-47) 

































































































































































soreceive 













































































16-51 






























































if (m && pr->pr flags & PR ATOMIC) ( 


uipc_socket.c 

































































































































































































































































































































































































































































695 flags |= MSG_TRUNC; 
696 if ((flags € MSG_PEEK) == 0) 
697 (void) sbdroprecord(&so-»so rcv); 
698 } 
699 if ((flags & MSG_PEEK) == 0) { 
700 if (m == 0) 
701 So-»so rcv.sb mb = nextrecord; 
702 if (pr->pr flags & PR WANTRCVD && so->so_pcb) 
703 (*pr-»pr usrreq) (so, PRU, RCVD, (struct mbuf +) 0, 
704 (struct mbuf *) flags, (struct mbuf *) 0, 
705 (struct mbuf *) 0); 
706 H 
707 if (orig resid == uio-»uio resid && orig resid && 
708 (flags & MSG EOR) == 0 && (so-»so state & SS CANTRCVMORE) == 0) { 
709 sbunlock(&so-»so rcv); 
710 splx(s); 
711 goto restart; 
712 } 
713 if (flagsp) 
714 *flagsp |- flags; 
uipc_socket.c 
O 16-51 soreceive JU 00000 
24. 
694-698 ( ) 
MSG_TRUNC 
recvmsg MSG_TRUNC soreceive 
25. 
699-706 MSG_PEEK mbu 
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26. 
707-712 |] [| soreceive 
uuu soreceive[][l[] restart 
713-714 soreceive *flagsp soreceive 
Soreceive 
( ) ( mbufl] ) 
sosend soreceive 
[Partridge and Pink 1993] UDP [| soreceive 
| i 0 | 
soreceive u y 































































































































































































16.13 select) li 0 
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16-52 select 
select] 000 0 
000000000 . 
listen] [] D] 000000 S 
DU DD DDD D S 
O0O0000000000000000000000 ° 
OO0O0000000 . 
U D D 000 0 . 
ooBJ 000000 ° 
0 16-52 select DD [1 000000 
select[] | L 16-53[] 0 
1. 
390-410 ibits[]obits 
bzero 0 nd 
nd ni 
nd (1 1 ) 256 
(FD SETSIZE)[]falset 32 bit (NFDBITS) nd 65 
ni-howmany (65, 32) X 4=3X 4-12 
howmany (x[] y)[] x Hy 
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tre l 


























390 struct select_args ( sys. ig 
391 u int nd; 
392 fd set *in, "ou, *ex; 
393 struct timeval *tv; 
394 }; 
395 select (p, uap, retval) 
396 struct proc *p; 
397 struct select args *uap; 
398 int *retval; 
399 { 
400 fd set ibits[3], obits[3]; 
401 struct timeval atv; 
402 int s, ncoll, error = 0, timo; 
403 u int ni; 
404 bzero((caddr t) ibits, sizeof(ibits)); 
405 bzero((caddr t) obits, sizeof(obits)); 
406 if (uap->nd > FD SETSIZE) 
407 return (EINVAL); 
408 if (uap-»nd > p-»p fd->fd nfiles) 
409 uap-»nd = p-»p fd->fd nfiles; /* forgiving; slightly wrong */ 
410 ni - howmany(uap-»nd, NFDBITS) * sizeof(fd mask); 
411 #define getbits(name, x) \ 
412 if (uap->name && V 
413 (error = copyin((caddr t)uap-»name, (caddr t)&ibits[x]l, ni))) A 
414 goto done; 
415 getbits(in, 0); 
416 getbits(ou, 1); 
417 getbits(ex, 2); 
418 #undef getbits 
419 if (uap->tv) { 
420 error = copyin((caddr_t) uap->tv, (caddr_t) & atv, 
421 sizeof (atv)); 
422 if (error) 
423 goto done; 
424 if (itimerfix(&atv)) { 
425 error = EINVAL; 
426 goto done; 
427 } 
428 S = splclock(); 
429 timevaladd(&atv, (struct timeval *) &time); 
430 timo = hzto(&atv); 
431 /* 
432 * Avoid inadvertently sleeping forever. 
433 */ 
434 if (timo == 0) 
435 . timo - 1; 
436 splx(s); 
437 ) else 
438 timo = 0; I i 
sys generic.c 
O 16-53 select U D] LH D] LU 
2. 
411-418  getbits copyin ibits 
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419-438 tv timeo O[] select tv 
itimerfix timevaladd 
hzto timo 
0 timeo|[] 1 select O[] timeval 
















































































































































































































































































select 16-54 




























































































































































































439 ans. TI sy generic.c 


439 retry: 

440 ncoll - nselcoll; 

441 p-»p flag |= P SELECT; 

442 error = selscan(p, ibits, obits, uap->nd, retval); 

443 if (error || *retval) 

444 goto done; 

445 s = splhigh(); 

446 /* this should be timercmp(&time, &atv, >=) */ 

447 if (uap->tv && (time.tv sec > atv.tv sec [| 

448 time.tv sec == atv.tv sec && time.tv_usec >= atv.tv usec)) { 
449 splx(s); 

450 goto done; 

451 ) : 

452 if ((p-»p flag & P SELECT) -- 0 || nselcoll !- ncoll) ( 
453 splx(s); 

454 . goto retry; 

455 H 

456 p-»p flag &- ^P SELECT; 

457 error - tsleep((caddr t) & selwait, PSOCK | PCATCH, "select", timo); 
458 splx(s); 

459 if (error == 0) 

460 goto retry; 

461 done: 

462 p->p_flag &= "P SELECT; 

463 /* select is not restarted after signals... */ 

464 if (error == ERESTART) 

465 error = EINTR; 

466 if (error == EWOULDBLOCK) 

467 error = 0; 

468 #define putbits(name, x) \ 

469 if (uap->name && \ 

470 (error2 = copyout((caddr t)&obits[x], (caddr t)uap-»name, ni))) A 
471 error = error2; : 
472 if (error == 0) { 

473 int error2; 

474 putbits(in, 0); : 

475 putbits(ou, 1); 

476 putbits(ex, 2); 

477 #undef putbits 

478 } 

479 return (error); 

480 } 





U 16-54 select [] HU B U D D 


























































































































































































































439-442 retry select 
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nselcoll P_SELECT selscan([] 16-55) 
select 
selscan 
— - sys generic.c 
481 selscan(p, ibits, obits, nfd, retval) 
482 struct proc *p; 
483 fd set *ibits, *obits; 
484 int nfd, *retval; 
485 I 
486 struct filedesc *fdp = p->p_fd; 
487 int msk, i, j, £d; 
488 fd mask bits; 
489 struct file *fp; 
490 int n = 0; 
491 static int flag[3] = 
492 {FREAD, FWRITE, 0}; 
493 for (msk = 0; msk < 3; msk++) { 
494 for (i = 0; i < nfd; i += NFDBITS) { 
495 bits = ibits[msk].fds bits[i / NFDBITS]; 
496 while ((j = ffs(bits)) && (fd = i +.--j) < nfd) { 
497 o bits &= "(1 << j); ' 
498 fp = fdp->fd_ofiles[fd]; 
499 if (fp == NULL) 
500 return (EBADF); . 
501 if ((*fp->f ops->fo select) (fp, flag[msk], p)) ( 
502 FD SET(fd, &obits[msk]); 
503 net; 
504 } 
505 } 
506 ] 
507 } 
508 *retval = n; 
509 return (0); 
510 } P 
— sys generic.c 
O 16-55 selscan [] [] 
5. 
443-444 
6. 
445-451 
Së selscan 
452-455 selscan P_SELECT 
nselcoll selscan 
8. 
456-460 select tsleep selwait 16- 
60 tsleep 
select retry 
9. 
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461-480 done P_SELECT ERESTART EINTR 
EWOULDBLOCK 0 select 
EINTR 0 































































































16.13.1 selscan 























































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































select | 16-55 selscan 
selscan | |] 
so select soo select 
1. 
481-496 for for 
| 32 bit(NFDBITS) 
while 32 bit 
bits ffs bits 
bits 1000 ( 2810) ffs (bits) 4 
2. 
497-500 ill ffs fd bits 
( ) file 
fo select 
fo select flag msk for 
FREAD FWRITE 
0 EBADF 
3. 
501-504 
n( JE 1 
505-510 | | | | | *retval 
16.13.2 soo, select 
selscan selscan 
fileops ( 15.5[] ) fo select 
16-56 Soo select 
sys socket.c 


105 soo_select (fp, which, p) 
106 struct file *fp; 


107 int which; 

108 struct proc *p; 

109 ( 

110 struct socket *so = (struct socket *) fp->f data; 
111 int ` s = splnet(); 

112 switch (which) ( 

113 case FREAD: 

114 if (soreadable(so)) ( 


O 16-56 soo select [| [J 












































426 "uu: China"pub.tom 
A A 
































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































115 splx(s); 
116 return (1); 
117 } 
118 selrecord(p, &so->so_rcv.sb_sel); 
119 so->so_rcv.sb_flags |= SB_SEL; 
120 break; 
121 case FWRITE: 
122 if (sowriteable(so)) { 
123 spix(s); 
124 return (1); 
125 } 
126 selrecord (p, &so->so_snd.sb_sel); 
127 so->so_snd.sb_flags |- SB_SEL; 
128 break; 
129 case 0: | 
130 if (so->so_oobmark || (so->so_state & SS_RCVATMARK)) ( 
131 splx(s); 
132 return (1); 
133 ) 
134 selrecord(p, &so->so_rcv.sb_sel); 
135 so->so_rcv.sb_flags |= SB SEL; 
136 break; 
137 ) 
138 splx(s); 
139 return (0); 
140 ) 
sys socket.c 
O 16-56 (O) 
105-112 soo select which 
1 selrecord 
soo select 0 
16-520 00 E | E soo select[] soreadable 
Sowriteable sys/socketvar.h 
1. 
113-120 soreadabl ef 
#define soreadable(so) \ 
((so)-»so rcv.sb cc >= (so)->so_rcv.sb_lowat || * 
((so)->so_state & SS CANTRCVMORE) || \ 
(so) ->so_qlen | (so) ->so_error) 
UDP[] TCP 1 ([] 16-4) 
2. 
121-128 sowriteable 
#define sowriteable(so) \ 
(sbspace (& (so) ->so_snd) >= (so)->so_snd.sb_lowat KK \ 
(((so)-»so state&SS ISCONNECTED) || ^ 
((so)-»so proto-»pr flags&PR CONNREQUIRED)==0) || \ 
((so)-»so state & SS CANTSENDMORE) || \ 


(so)-»so error) 















































TCP[] UDP 2048 UDP sowriteable 
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sbspace sb_hiwat so_lowat 
TCP 2048 
16-52 
3. 
129-140 so oobmark[| SS_RECVATMARK 



































































































































































































































16.13.3 selrecord 


































































































































































































16-57 selinfo (O 16-3 sb sel 
) 
41 struct selinfo ( select.h 
42 pid t Si pid; /* process to be notified */ 
43 short Si flags; /* 0 or SI COLL */ 


44 y; 
G — a —— EE 


0 16-57 selinfo U [| 



































































































































































































































































































































































































































































































































































































































































































































































































































































































































41-44 select sl_pid 
select sl_flags SI_COLL 
sl flags 
soo select selrecord 16-58 
S generic.c 
522 void Sys. 8! 
523 selrecord(selector, sip) 
524 struct proc *selector; 
525 struct selinfo *sip; tb 
526 { 
527 Struct proc *p; 
528 pid_t mypid; 
529 mypid = selector->p_pid; 
530 if (sip->si_pid == mypid) 
531 return; 
532 if (sip->si_pid && (p = pfind(sip->si_pid)) && 
533 p->p_wchan == (caddr_t) & selwait) 
534 sip->si_flags |= SI COLL; 
535 else 
536 sip->si pid = mypid; 
537 } . 
Sys generic.c 
O 16-58 selrecord [] O 
1. 
522-531 selrecord select proc 
selinfo so_snd.sb_sel|| so_rcv.sb_sel 
selinfo select 
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China=pu 









































HI 
































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































TCP/IP 2 
2. ? 
532-534 select SI_COLL 
3. 
535-537 Si pid 0 | U 
Si pid 
16.13.4 selwakeup 
Net/3 
selinfo 
( SI COLL)[] Net/3 
n 16-54 | | 
select tsleep selwait 
wakeup select — 
16-59 selwakeup 
OOB[| O00 uat uae 
O 16-59 selwakeup [J [J 
LU U LU | | | 16-59 0 0 
16-59 selwakeup 
selwakeup 16-60 
541-548 si_pid 0 ODO select 
549-553 select nselcol1[] 1 
select 16-54 tsleep 
nselcoll select uuu (O O 16.9) 
554=567 si pid selwait 
P_SELECT selrecord 
selscan 
EBADF selinfo selwakeup selwakup 
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sel_pid selinfo 
( ) 
selwakeup nselcoll 0 
select 
541 void sys generic.c 
542 selwakeup(sip) 
543 struct selinfo *sip; 
544 ( 
545 struct proc *p; 
546 int S; 
547 if (sip-»si pid == 0) 
548 return; 
549 if (sip->si flags & SI COLL) { 
550 nselcoll++; 
551 sip->si_flags &= “SI COLL; 
552 wakeup((caddr t) & selwait); 
553 } 
554 p = pfind(sip->si pid); 
555 sip->si_pid = 0; 
556 if (p != NULL) { 
557 s = splhigh(); 
558 if (p->p_wchan == (caddr_t) & selwait) { 
559 if (p->p_stat == SSLEEP) 
560 setrunnable (p); 
561 else 
562 unsleep (p); 
563 } else if (p-»p flag & P, SELECT) 
564 p->p_flag &- ^P SELECT; 
565 splx(s); 
566 ) 
567 ) l 
sys generic.c 
U 16-60 selwakeup [| J] 
16.14 ID 
sosend soreceive 

















































































































































































































































































































select 




















































































































































































































































































































select 
























































U U 


16.1 write 























































































































































































































430 us no China-pub.com 
TT 


sosend[] [| resid[] U [| [| 





































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































16.2 [] sosend[] [] [| MCLBYTES) 000000000000 space [] MCLBYTES 

OD 0 LU | [| atomic O U mbuf| OO! 0 
? 
16.3 0 0 0 [|] sosend[] soreceivel O O 
U | OU OU 
? 

16.4 PR_ATOMIC O O 0o O UD O 

0 MSG, EOR[] OG 0 
0 2 

16.5 00090 | 00000 MSG DONTWAIT[][] 
sosend| | L UT TT TT TT I O 2 

16.6 0 Sb cc«sb hiwat sbspace | | ?| 
M g? 

167 000 reevit| ual | Ú IO 7 

16.8 soreceive[] [| [| MSG EoR[] 

16.9 [] nselcoll [| select[] selwakeup[] [] ? 

16.10 select 000 select] J Uu U 








































































































Ahiaska 


Ui 00 00 


171 DD 

















































































































































































































































































































































































































































































































































































































setsockopt[] getsockopt 8.8[] O00 0 IP 
ioctl 4.4 4.4 
ioctl 6.7 
IP ioctl ioctl fentl 
[| getsockname|| getpeername LI LI Li 


































































































17-1 U 0 











































































































































tcp_ctloutput rip_ctloutput 


ip_ctloutput 


O 17-1 setsockopt [| getsockopt 0000 


17.2 0000 






























































































































































17-2 
0 0 O [] U 
kern/kern descrip.c fcnt1[] OOO 
kern/uipc_syscalls.c setsockopt[] getsockopt[] getsockname[] getpeername[] [I [1 [] 
kern/uipc socket.c OOOO setsockopt[] getsockopt [1 [] 
kern/sys socket.c ioctl[] 000000000 
01172 00000000 
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565-597 








int setsockopt (int s, 


| U O setsockopt 000000 
getsock[] [JO U U 
000000 





17-4 

















int level, 




















[] filel] 








int optname, void *optval, 


000 





[] val] [J 


int optlen) ; 

















m get[] [] [] mburi 0 O O 








O 


0000060 


U U U 


[] valsizel] 


TCP/IP] U [] 20 
| U 
dut LU U U U U U U U U UD U U U U U (U (U LU U U U 
17.3 setsockopt|| [|] [| [] 
8-29] J U U 0 setsockopt ([] getsockopt) || 
SOL SOCKET 17-3 
optname optval [] [] [] [] [] O 
SO_SNDBUF int so_snd.sb_hiwat 0000000090 
SO_RCVBUF int so_rcv.sb_hiwat 00000000 
SO_SNDLOWAT int so_snd.sb_lowat 0200000000 
SO_RCVLOWAT int so_rcv.sb_lowat 0000000090 
SO SNDTIMEO struct timevalso snd.sb timeo 00000 
SO_RCVTIMEO struct timevalso_snd.sb_timeo 00000 
SO_DEBUG int so_options 0400000 
SO_REUSEADDR int so_options OOO00000000000 
SO REUSEPORT int so options p4g40000000000 
SO_KEEPALIVE int so_options 0000000090 
SO_DONTROUTE int so_options 0000 
SO_BROADCAST int so_options U U 00 0 U 
SO_USELOOPBACK | int so_options OOO0000000000000000 
U D D 
SO_OOBINLINE int so_options 000000000090 
SO LINGER struct linger so linger 000000000000 
SO ERROR int so error 000000000000 0 getsockopt 
SO TYPE int so type 0000000000 getsockopt 
un [] ] ENOPROTOOPT 
O 17-3 setsockopt [| getsockopt UI 
setsockopt 000090 




















O MLEN[] D 





















































valsize|| 























OMLEnND H 0 0 EINVAL 





565 struct setsockopt_args { 


566 
567 
568 
569 
570 
571 1; 


int 
int 
int 


int 


572 
573 
574 


575 int 


s; 
level; 
name; 


caddr_t val; 


valsize; 


setsockopt p, uap, retval) 
struct proc *p; 

struct setsockopt_args *uap; 
*retval; 


DO 17-4 setsockopt 








U sosetopt|| 


0000 



































U U U UU U 


uipc_syscalls.c 
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576 ( 
577 struct file *fp; 
578 struct mbuf *m = NULL; 
579 int error; 
580 if (error = getsock(p-»p fd, uap->s, &fp)) 
581 return (error); 
582 if (uap->valsize > MLEN) 
583 return (EINVAL); 
584 if (uap->val) { 
585 m = m get (M WAIT, MT SOOPTS); 
586 if (m == NULL) 
587 return (ENOBUFS); 
588 if (error = copyin(uap->val, mtod(m, caddr t), 
589 (u int) uap->valsize)) { 
590 (void) m free(m); 
591 return (error); 
592 } 
593 m->m_len = uap->valsize; 
594 } 
595 return (sosetopt ((struct socket *) fp->f data, uap->level, 
596 uap->name, m)); 
597 3 
— O—uipc_svscalls.c 
117-4 (0) 
sosetopt 
sosetopt 
pr_ctloutput 17-5 sosetopt 











uipc_socket.c 


752 sosetopt (so, level, optname, m0) 
753 struct socket *so; 


754 int level, optname; 

755 struct mbuf *m0; 

756 { 

757 int error = 0; 

758 struct mbuf *m = m0; 

759 if (level != SOL SOCKET) I 

760 if (so->so_proto && so->so_proto->pr_ctloutput) 

761 return ((*so->so_proto->pr_ctloutput) 

762 (PRCO SETOPT, so, level, optname, &m0)); 
763 error = ENOPROTOOPT; ` 
764 } else { 

765 switch (optname) { 





841 default: 

842 error = ENOPROTOOPT; 

843 break; 

844 } 

845 if (error == 0 && so->so_proto && so-»so proto-»pr, ctloutput) { 
846 (void) ((*so->so_proto->pr_ctloutput) 

847 (PRCO_SETOPT, so, level, optname, &m0)); 


O 17-5 sosetopt UI 
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TCP/IP [] 2 
848 m = NULL; /* freed by protocol */ 
849 } 
850 } 
851 bad: 
852 if (m) 
853 (void) m free(m); 
854 return (error); 
855 ] o 
uipc_socket.c 
117-5 (0) 
752-764 (SOL_SOCKET) PRCO_SETOPT 
pr_ctloutput pr usrreg 17-6 
Internet pr_ctloutput 
[] pr. ctloutput[] [] O O 
UDP ip_ctloutput O 8.80 
TCP tcp_ctloutput O 30.60 
ICMP 
IGMP rip_ctloutput[] ip_ctloutput 0 8.80 0 O 32.80 
OM IP 
DH 17-6 pr ctloutput [| [| 
765 switch GOGL 
841-844 o mbu ENOPROTOOPT 
845-855 switch switch 
Internet[] | 
pr_ctloutput 
m m_free 
17-7 | linger | 
766-772 linger lingerl] |] 
struct linger { 
int 1 onoff; /* option on/off */ 
int 1 linger; /* linger time in seconds */ 
y; 
[] linger 1 linger [] | 
so linger case[] so linger[| close 
15.15 
773-789 0 0 
( ) mbuf| 
17-8 uli 
790-815 if 
SO SNDBUF[] SO. RCVBUF[] sbreserve[] 
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SO SNDLOWAT|| SO RCVLOWAT 
















































































766 case SO LINGER: uipe socket.c 
767 if (m == NULL || m-»m len !- sizeof(struct linger)) { 
768 error - EINVAL; 
769 goto bad; 
770 } 
771 so->so_linger = mtod(m, struct linger *)-»1 linger; 
772 /* fall thru... */ 
773 case GO DEBUG: 
774 case 50 KEEPALIVE: 
775 case SO DONTROUTE: 
776 case SO USELOOPBACK: 
777 case SO_BROADCAST: 
778 case SO_REUSEADDR: 
779 ` case SO REUSEPORT: 
780 case SO_OOBINLINE: 
781 if (m == NULL || m-»m len < sizeof(int)) ( 
782 error = EINVAL; 
783 goto bad; 
784 ) 
785 if (*mtod(m, int *)) 
786 so->so options |= optname; 
787 else 
788 s0->so options &= ”optname; 
789 break; 
uipc_socket.c 
O 17-7 sosetopt JO [| linger [0000 
uipc_socket.c 
790 case SO_SNDBUF: 
791 case 50 RCVBUF: 
792 case SO SNDLOWAT: 
793 case SO RCVLOWAT: 
794 if (m == NULL || m-»m len « sizeof(int)) { 
795 error - EINVAL; 
796 goto bad; 
797 } 
798 switch (optname) { 
799 . case SO_SNDBUF: 
800 case SO_RCVBUF: 
801 if (sbreserve (optname == SO_SNDBUF ? 
802 £so->so_snd : &so-»so rcv, 
803 (u long) * mtod(m, int *)) == 0) í 
804 error - ENOBUFS; : 
805 goto bad; 
806 } 
807 break; 
808 case SO_SNDLOWAT: 
809 so->so_snd.sb_lowat = *mtod(m, int *); 
810 break; 
811 case SO_RCVLOWAT: 
812 so->so_rcv.sb_lowat = *mtod(m, int *); 
813 break; 
814 } 
815 break; M 
uipc_socket.c 


0 17-8 sosetopt O [00000000 
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17-9 
uipc_socket.c 
816 case SO_SNDTIMEO: 
817 case SO_RCVTIMEO: 
818 { 
819 struct timeval *tv; 
820 short val; 
821 if (m == NULL || m->m_len < sizeof(*tv)) { 
822 error = EINVAL; 
823 goto bad; 
824 } 
825 tv = mtod(m, struct timeval *); 
826 if (tv->tv_sec > SHRT_MAX / hz - hz) { 
827 error = EDOM; 
828 goto bad; 
829 } 
830 val = tv->tv_sec * hz + tv->tv_usec / tick; 
831 switch (optname) { 
832 case SO_SNDTIMEO: 
833 so->so_snd.sb_timeo = val; 
834 break; 
835 case SO RCVTIMEO: 
836 so->so rcv.sb timeo = val; 
837 break; 
838 } 
839 break; 
840 } ; 
uipc_socket.c 
17-9 sosetopt [100000 
816-824 timeval SO SNDTIMEO[|| SO_RCVTIMEO 
EINVAL 
825-830 timeval sb timeo 
826 
tv usec 
tv_secxhz+ — > SHRT MAX 
tick 





ticck-1 000 000/H&HRT MAX=32767 























































































































SHRT_MAX tv_usec SHRT_MAX tv_usec 

> ——Ə— — — _ = —vsE— — —J 

GEES hz tickxhz hz 100000 
hz 


















































































































































if (tv->tv sec * hz+tv->tv_usec/tick>SHRT_MAX) 
error=EDOM; 













































































































































































































































































































































































































































































17.3 
831-840 | vall |] 0 sb timeo 
| | U U 0 16.70) 16.11 
tsleep tsleep 
65535 100 Hz 11 
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17.4 getsockopt U 0 



































































































































getsockopt 





int getsockopt (int s, int level, int name, caddr t val, int *valsize) ; 


17-10 



















































































uipc_syscalls.c 
598 struct getsockopt_args { 


599 int s; 

600 int level; 
601 int name; 

602 caddr_t val; 

603 int *avalsize; 
604 ); 


605 getsockopt (p, uap, retval) 
606 struct proc *p; 
607 struct getsockopt_args *uap; 






















































































































































































































































































































































































































































































































































































































































































608 int *retval; 
609 1 
610 struct file *fp; 
611 struct mbuf *m = NULL; 
612 int valsize, error; 
613 if (error = getsock(p->p_fd, uap->s, &fp)) 
614 return (error); 
615 if (uap->val) { y 
616 if (error = copyin((caddr_t) uap->avalsize, (caddr_t) & valsize, 
617 sizeof (valsize))) 
618 return (error); : 
619 ) else 
620 valsize - 0; 
621 if ((error = sogetopt((struct socket *) fp->f data, uap->level, 
622 uap->name, &m)) == 0 && uap->val && valsize && m != NULL) ( 
623 if (valsize > m->m len) 
624 valsize = m->m len; 
625 error = copyout (mtod(m, caddr t), uap->val, (u int) valsize); 
626 if (error == 0) 
627 error = copyout((caddr t) & valsize, 
628 (caddr t) uap->avalsize, sizeof (valsize)); 
629 } 
630 if (m != NULL) 
631 (void) m_free (m); 
632 return (error); 
633 } l . 
uipe_syscalls.c 
0 17-10 getsockopt JO OD 
598-633 getsock file 
sogetopt sogetopt 
mbu 
sogetopt 
sosetopt sogetopt 
17-11 sogetopt 
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TCP/IP 
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- uipc_socket.c 
856 sogetopt (so, level, optname, mp) 
857 struct socket *so; ji 
858 int level, optname; 
859 struct mbuf **mp; 
860 { 
861 struct mbuf *m; 
862 if (level != SOL_SOCKET) { 
863 if (so->so_proto && so->so_proto->pr_ctloutput) { 
864 return ((*so->so_proto->pr_ctloutput) 
865 (PRCO_GETOPT, so, level, optname, mp)); 
866 } else 
867 return (ENOPROTOOPT); 
868 } else { 
869 m = m_get (M_WAIT, MT SOOPTS); 
870 m->m_len = sizeof (int); 
871 switch (optname) { 
918 default: 
919 (void) m_free(m); 
920 return (ENOPROTOOPT); 
921 } 
922 *mp = m; 
923 return (0); 
924 } 
925 T a 
uipc_socket.c 
U 17-11 sogetopt 00000 
856-871 sosetopt 
PRCO_GETOPT mp mbu 
mbuf 
m_len switch mbu 
918-925 switch default mbuf 
ENOPROTOOPT switch mbuf *mp 
getsockopt mbu mbu 
17-12 SO_LINGER 
872-877 SO_LINGER 1_onoff 
1_linger 
878-887 so options[| optname 
0 0 
1 
sogetopt (O 17-13) mbuf] 
888-906 mbu 
( ) so error mbu 
so error getsockopt 
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uipc socket.c 
872 case SO LINGER: 
873 m-»m len - sizeof(struct linger); 
874 mtod(m, struct linger *)->1_onoff = 
875 so->so_options & SO LINGER: 
876 mtod(m, struct linger *)->1 linger = so->so_linger; 
877 break; 
878 case SO_USELOOPBACK: 
879 case SO_DONTROUTE: 
880 case SO_DEBUG: 
881 case SO_KEEPALIVE: 
882 case SO REUSEADDR: 
883 case SO REUSEPORT: 
884 case SO BROADCAST: 
885 case SO OOBINLINE: 
886 *mtod(m, int *) - so-»so options & optname; 
887 break; 
uipc_socket.c 
0 17-12 sogetopt 0 0 0 sommer JO 00000 
uipc socket.c 
888 case SO TYPE: 
889 *mtod(m, int *) = so->so type; 
890 break; 
891 case SO_ERROR: 
892 *mtod(m, int *) = so->so error; 
893 so->so error = 0; 
894 . break; 
895 case SO_SNDBUF: 
896 *mtod(m, int *) = so->so_snd.sb_hiwat; 
897 break; 
898 case SO_RCVBUF: 
899 *mtod(m, int +) = so-»so rcv.sb hiwat; 
900 break; 
901 case SO SNDLOWAT: ° 
902 *mtod(m, int *) = so->so_snd.sb_lowat; 
903 break; 
904 case SO RCVLOWAT: 
905 *mtod(m, int *) = so->so_rcv.sb_lowat; 
906 break; 
uipc_socket.c 
U 17-13 sogetopt OOOO D LI LI D 
uipc socket.c 
907 case SO SNDTIMEO: 
908 case SO RCVTIMEO: 
909 ( 
910 int val = (optname == SO SNDTIMEO ? 
911 s0->so snd.sb timeo : so-»so rcv.sb timeo); 
912 m-»m len - sizeof(struct timeval); 
913 mtod(m, struct timeval *)-»tv sec = val / hz; 
914 mtod(m, struct timeval *)->tv_usec = 
915 (val $ hz) / tick; 
916 break; 
917 } 
uipc_socket.c 





0 17-14 sogetopt D DO D D U 0 
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TCP/IP 2 
17-14 sogetopt SO_SNDTIMEO 
SO_RCVTIMEO 
907-917 sb_timeo var val 
mbuf[] timeval 
tv_usec{] [| L | | "(val $ hx* tick 
17.5 penti iocti[][]D D 
API loctl fcntl 
ioctl fcntl 
17-15 
















































































ioctl 





int ioctl(int fd, unsigned 
int fcntl(int fd, int cmd,... 

















DÅ 






udp usrreg 


D 17-15 fentl H ioctl DD 





fcntl [] 






































long result, char *argp); 


/* int arg */); 
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17-16 17-16 
Posix O_NONBLOCK 
FNONBLOCK O_ASYNC FASYNC 
[ O fcntl ioctl 

0000000 so state [ SS NBIO | FNONBLOCK[ 00000 FIONBIO[ [| 
U000 0000000 

0000000 sb flags [ sBasvwc| FASYNCOH U 0000 FIOASYNC[] [] 
O00000000000 

00000 so pgid] 0 0 sIGIoc] F_SETOWN[] F_GETOWN SIOCSPGRP[] SIOCGPGRP[] J] 

stcuRGOOOOOO00000 

O0000000000000 FIONREAD 
so rev.sb cc 

000080000090 so state] [0 SIOCATMARK 
SS RCVATMARK[] [] 

















O 17-16 fentl [] iocti [] U 





17.5.1 fentl 


































































































































































































































































































































































































17-17 fcntl 
kern descrip.c 
133 struct fcntl args ( 
134 int fd; 
135 int cmd; 
136 int arg; 
137 As 
138 /* ARGSUSED */ 
139 fentl(p, uap, retval) 
140 struct proc *p; 
141 struct fcntl args *uap; 
142 int *retval; 
143 ( 
144 Struct filedesc *fdp - p-»p fd; 
145 Struct file *fp; 
146 struct vnode *vp; 
147: int i, tmp, error, flg = F_POSIX; 
148 struct flock fl; 
149 u int newmin; 
150 if ((unsigned) uap->fd >= fåp->fd nfiles || 
151 . (fp = fdp->fd_ofiles[uap->fd]) == NULL) 
152 return (EBADF); 
153 Switch (uap->cmd) { 
um RES 

253 default: 
254 return (EINVAL); 
255 } 
256 /* NOTREACHED */ 
i kern_descrip.c 


H 17-17 so 0000000 
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TCP/IP 2 
133=153 switch 
253=257 fcntl EINVAL 
17-18 fcntl 
kern descrip.c 
168 case F_GETFL: 
169 *retval = OFLAGS(fp->f flag); 
170 return (0); 
171 case F_SETFL: 
172 fp->f flag &= ~FCNTLFLAGS; ` 
173 fp->f_flag |- FFLAGS(uap->arg) & FCNTLFLAGS; 
174 tmp = fp->f flag & FNONBLOCK; 
175 error = (*fp->f ops-»fo ioctl) (fp, FIONBIO, (caddr t) & tmp, p); 
176 if (error) 
177 return (error); 
178 tmp = fp->f flag & FASYNC; 
179 error = (*fp->f ops->fo ioctl) (fp, FIOASYNC, (caddr t) E tmp, p); 
180 if (lerror) - 
181 return (0); 
182 fp->f flag &= ~FNONBLOCK; 
183 tmp = 0; 
184 (void) (*fp->f ops->fo ioctl) (fp, FIONBIO, (caddr_t) & tmp, p); 
185 return (error); 
186 case F_GETOWN: 
187 if (fp->f type == DTYPE_SOCKET) { 
188 *retval = ((struct socket +) fp->f data)->so pgid; 
189 return (0); 
190 ) 
191 error = (*fp->f ops-»fo ioctl) 
192 (fp, (int) TIOCGPGRP, (caddr_t) retval, p); 
193 *retval = -*retval; 
194 return (error); 
195 case F_SETOWN: 
196 if (fp->f type == DTYPE SOCKET) { 
197 ((struct socket +) fp->f data)-»so pgid = uap->arg; 
198 return (0); 
199 ) 
200 if (uap->arg <= 0) ( 
201 uap->arg = -uap->arg; 
202 } else { 
203 struct proc *pl = pfind(uap->arg); 
204 if (pl == 0) 
205 return (ESRCH); 
206 uap->arg = pl->p_pgrp->pg_id; 
207 } 
208 return ((*fp->f_ops->fo_ioctl) 2 
209 (fp, (int) TIOCSPGRP, (caddr_t) & uap->arg, p)); 2 
kern_descrip.c 
[] 17-18 fett IJ 00000000 
168-185 F_GETFL F_SETFL 
fo ioctl[| FNONBLOCK|| FASYNC 










































































17-20 



















































































soo_ioctl fo_ioctl 






























































fo_ioctl FNONBLOCK 
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186-194 F GETOWN so pgid 
TIOCGPGRPi oct Å | fo ioctl F SETOWN 

























































































































































































So pgid | 














17.5.2 ioct1[][] 













































































loctli soo ioctl | 17-20 
ioctl 17-17 soo ioctl 






























































































































































































































































rtioctl ifioctl 



























































pr usrreq 

























































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































55-68 soo ioctl *data FIONBIO 
| accept 
connect|| close 
69-79 FIOASYNC VO SS_ASYNC 
sowakeup SIGIO 
80-88 FIONREAD SIOCSPGRP 
SIOCGPGRP so_pgid SIGIO 
SIGURG 
89-92 SIOCATMARK 
ioctl FIOxxx|] SIOxxx 17-19 
























































































































































13 bits 8 bits 8 bits 
[117519 seer [DET DL D D EL D 


55 soo ioctl(fp, cmd, data, p) 
56 struct file *fp; 

57 int cmd; 

58 caddr t data; 

59 struct proc *p; 


60 ( 

61 struct socket *so = (struct socket *) fp->f data; 
62 switch (cmd) ( i 
63 . case FIONBIO: 

64 if (*(int *) data) 

65 so->so_state [= SS_NBIO; 

66 else 

67 so->so_state &= "SS_NBIO; 

68 return (0); 

69 case FIOASYNC: 

70 if (*(int *) data) { 

71 so->so_state |= SS_ASYNC; 

72 so->so_rcv.sb_flags |- SB ASYNC; 


O 17-20 soo ioctl [| JJ 
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so->so_snd.sb_flags |- SB. ASYNC; 













































































































































































































































































































































































































































































































































































































































































































































































































































































73 
74 ) else ( 
75 SOo-»SO State &= "SS ASYNC; 
76 So-»so rcv.sb flags &= "SB ASYNC; 
77 So-»80, snd.sb flags &= "Sp ASYNC; 
78 } i 
79 return (0); 
80 case FIONREAD: 
81 *(int *) data = so-»so rcv.sb cc; 
82 return (0); i 
83 case SIOCSPGRP: I 
84 so->so_pgid = *(int *) data; 
85 return (0); 
86 case SIOCGPGRP: 
87 *(int *) data = so->so_pgid; 
88 return (0); 
89 case SIOCATMARK: 
90 *(int *) data = (so->so_state & SS_RCVATMARK) != 0; 
91 return (0); 
92 } 
93 /* 
94 * Interface/routing/protocol specific ioctls: 
95 * interface and routing ioctls should have a | 
96 * different entry since a socket's unnecessary 
97 */ : 
98 if (IOCGROUP (cmd) == 'i') 
99 return (ifioctl(so, cmd, data, p)); 
100 if (IOCGROUP (cmd) == ’r’) 
101 return (rtioctl(cmd, data, p)); 
102 return ((*so->so_proto->pr_usrreq) (so, PRU CONTROL, 
103 (struct mbuf *) cmd, (struct mbuf *) data, (struct mbuf *) 0)); 
104 } 
sys socket.c 
0 17-20 (0) 
ioctl 
input output 
votd IOCPARM_LEN (cmd) O O cmd [| length 
IOCBASECMD (cmd) length] 0 OU D 
length ( ) TOCGROUP (cmd) 0 D cmdQ O group 
group 
. D 17-21 iseti [I [JD 
number 17-21 ioctl 
93-104 IOCGROUP 8 bit[] group ifioctl 
rtioctl PRU CONTROL 
19 Net/2 
PF ROUTE 
ioctl rtioctl ENOTSUPP 




























































































































































































17.6 getsockname[] [ 00 


getsockname 

































































Chinaspub.toN ji 445 












































int getsockname (int fd, caddr t asa, int * alen); 





















































getsockname fd asa 
bind 

















































































































































































































































































































(2.2.5[] ) getsockname 17-22 







































































uipc_syscalls.c 
682 struct getsockname_args { PE sy 


683 int fdes; 
684 caddr t asa; 
685 int *alen; 
686 ); 


687 getsockname(p, uap, retval) 
688 struct proc *p; 
689 struct getsockname args *uap; 


690 int *retval; 

691 I 

692 struct file *fp; 

693 struct socket *so; 

694 struct mbuf *m; 

695 int len, error; 

696 if (error = getsock(p->p_fd, uap->fdes, &fp)) 

697 return (error); 

698 if (error = copyin((caddr t) uap->alen, (caddr t) & len, sizeof(len))) 
699 return (error); : 

700 so = (struct socket *) fp->f_data; 

701 m = m getclr(M WAIT, MT SONAME); 

702 if (m == NULL) 

703 return (ENOBUFS); 

704 if (error = (*so->so_proto->pr_usrreg) (so, PRU_SOCKADDR, 0, m, 0)) 
705 goto bad; 

706 if (len > m->m len) 

707 len = m->m len; f 

708 error = copyout (mtod(m, caddr_t), (caddr t) uap->asa, (u_int) len); 
709 if (error == 0) 

710 error = copyout((caddr_t) & len, (caddr_t) uap->alen, 

711 sizeof(len)); 

712 bad: 

713 m freem(m); 

714 return (error); 


715 ] ; 
III tp" syscalls.c 





























































































































































































































































































































































































































































































































[ 17-22 getsockname [] 0 0 
682-715 getsock file len 
m_getclr mbu bzero 
PRU_SOCKADDR m 
*alen 
mbu 














































































































17.7 getpeername | [] [J 



























































getpeername 





int getpeername (int fd, caddr t asa, int *alen); 
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getpeername accept 
fork[] exec ( inetd ) 
accept getpeername 
TP4 TP4 
accept 
getpeername 
TCP TCP accept 17-23 
getpeername 























719 struct getpeername args ( 


720 
721 
722 
723 }; 












































uipc syscalls.c 


int fdes; 
caddr t asa; 
int *alen; 


724 getpeername(p, uap, retval) 
725 struct proc *p; 
726 struct getpeername args *uap; 















































































































































































































































































































































727 int *retval; 
728 ( 
729 struct file *fp; 
730 Struct socket *so; 
731 struct mbuf *m; 
732 int len, error; 
733 if (error = getsock(p-»p fd, uap->fdes, &fp)) 
734 return (error); 
735 so = (struct socket *) fp->f data; 
736 if ((so-»so state & (SS ISCONNECTED | SS ISCONFIRMING)) == 0) 
737 return (ENOTCONN); 
738 if (error - copyin((caddr t) uap-»alen, (caddr t) & len, sizeof(len))) 
739 return (error); 
740 m = m.getclr(M WAIT, MT SONAME); 
741 if (m -- NULL) 
742 return (ENOBUFS); 
743 if (error -'(*so-»so proto-»pr usrreqd) (so, PRU PEERADDR, 0, m, 0)) 
744 goto bad: 
745 if (len » m-»m len) 
746 len - m-»m len; 
747 if (error - copyout(mtod(m, caddr t), (caddr t) uap-»asa, (u int) len)) 
748 goto bad; 
749 error = copyout((caddr t) & len, (caddr t) uap-»alen, sizeof(len)); 
750 bad: 
751 m freem(m); 
752 return (error); 
753 } 
uipc, syscalls.c 
O 17-23 getpeername 000 
719-753 getsockname getsock file 
( TP4) ENOTCONN 
mbuf 
PRU PEERADDR mbu 




















































































































































































































Chi puht M Ú 17| uni 447 


























U U U 0 D U D D 0 U D mom D 0 D Ú 
17.8 UI 


uggaumaumggguagimultitlutliliullli setcsockopt[] getsockopt 
U U U 0000000 DUD D UD U U U UD UD UD D DDD fentif iocetiD D Ul Lu lul 
getsockname[] getpeername[] JU 020090 


U U 


17.1 000000 mbuff] O (MELEN, 28 0 000 0 ? 
172 OQ 1770 0000000000 SOo_LINGER] |] ? 
173 [ 179000 00 timeval 000000000090 te» £v. see Y nz[] D Ú 
Hd |[D00000000000000 
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(routing policy) 
Net/3 
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«[] 20 


182 OOUUU 


Net/3 18-1 
1-1 ) 















































































































































































































































































































































Internet 
I 
Solaris 23 !.1.29 SVR4 


BSD/386 1.1 BSD /386 1.1 






0000 140.252.13.0 


0181 9000000000 








18-2 18-1[] bsdi 













































































“ 








































































































netstat 


Flags” 






























































































































































































































































/etc/netstart shell 


















































18 


Radix 












































449 





bsdi $ netstat -rn 


Routing tables 













































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































Internet: 
Destination Gateway Flags Refs Use Interface 
default 140.252.13.33 UG $ 0 3 le0 
127 127.0.0.1 UG S R 0 2 100 
127.0.0.1 127.0.0.1 UH 1 55 100 
128.32.33.5 140.252.13.33 UGHS 2 16 leù 
140.252.13.32 link#1 U C 0 0 led 
140.252.13.33 8:0:20:3:£6:42 UH L 11 55146 le0 
140.252.13.34 0:0:c0:c2:9b:26 UH L 0 3 led 
140.252.13.35 0:0:c0:6£:2d:40 UH L 1 12 100 
140.252.13.65 140.252.13.66 UH 0 41 s10 
224 link#1 U C 0 0 led 
224.0.0.1 link#1 UH L 0 5 led 
0182 QO es D D D D 0 
1) route sun(140 252 13 33) sun 
Internet[] PPP 
2) 127 (U gated) 
/etc/netstart route 
(O 5-27) 127.0.0.1 
3) (127.0.0.1) ifconfig 
4) [| vangogh.cs.berkeley.edu(128.32.33.5) route 
( 140.252.13.33) 
TCP 
TCP 27-3 
5) leo ifconfig 
140.252.13.32 
6) sun(140.252.13.33)[] svr4(140.252.13.34) ARP 
21 
7) (140.252.13.35) IP 
IP 4.4BSD 
21.13 
8) 140.252.13.65 ifconfig SLIP 
9) 244 route 
10) 224.0.0.1( all-host group) Ping 224.0.0.1 
“ Ping 224.0.0.1” 























































































































































































































18-2 18-25 















































































































































u Flags ” 
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TCP/IP 2 
G ( ) 
H 
netstat 
1 
S 18-2[] route 
C (clone) 
(140.252.13.32) ARP 
224 
(U 224.0.0.1) 
L ARP 
R ( ) 
NET/2 
127 6.6 
4.3BSD Reno IP 
0.0.0.0 
[Leffler et al. 1998] 11.5 
hash hash Net/l 
4.3BSD Reno [Sklower 1991] 
OSI 
32 IP 
Net/3 Patricia [Sedgewick 1990] (Patricia 
Patricia ”) 
32 bit IP 
48 bit XNS OSI 
Patricia Van Jacobson [] [Sklower 1991] 






























































































































































(search key) 





















































































































































































































































































































































































































































































































































































































































































































































































































































China-bubıcom m moon 451 































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































18-3 127.0.0.1[] 127.0.0.2 
127.0.0.1( 1 Oxffffffft) 127.0.0.0( 
Oxff000000) 
O O O =127.0.0.1 Hl D D =127.0.0.2 
gu uaa uu 0000 
1 H H 71000001 71000001 71000002 71000002 
2| 0000 71000001 71000001 71000001 71000000 
3 | 00000 mmm ff000000 ffffffff ff000000 
4 | 1930000 7£000001 7£000000 7£000002 71000000 
204000 Og U U u Og 
0 18-3 O OG 127.0.0.19 127.0.0.20 0000 0000000 
127.0.0.1 
(127.0.0.1) 
18-4 18-2[] Net/3 -A netstat 
18-4 
oF pit 32 | 
0x00000000 


oF pit 33 | oT pit 33 Jen 


oF pit 63 JA 2E pit 36 9n | as JO 
0x££000000 i 


0.0.0.0 








127.0.0.0 127.0.0.1 128.32.33.5 Ox££000000 
0xf£000000 

off bit 62 |" 

OXffffffe0 140.252.13.65 224.0.0.0 224.0.0.1 


Oxff000000 


"as ¿ES 


140.252.13.32 140.252.13.33 140.252.13.34 140.252.13.35 
Oxffffffeo 


0 18-4 0000 18-20 Netv30 00 
































end” 
















































































0 1 " end” [|] “ default” 






















































































































































































































































































































































































(internal node) (node) | 
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TCP/IP 2 
Oxffffffff 
( 
18-4 
18-5 Sockaddr in 
0000 32 63 
.| 00 [] 
mo 1 2 4 8 
D 18-5 Internet] DD 00000000 
IP 32 63 16 
2(AF_INET) 
IP 18-6 
IP 
18-4 

1. 

127.0.0.1 — 32[] 0 
330 1 
63[] 1 
(127.0.0.1) (127.0.0.1) 
DB 3333 3333 4444 4444 4455 5555 5555 6666 
ü D 2345 6789 0123 4567 8901 2345 6789 0123 
0010 10.1.2.3 

0111 0000 0000 0000 0000 0000 0000 0001 112.0.0.1 
0111 1111 0000 0000 0000 0000 0000 0000 | 127.0.0.0 
0111 1111 0000 0000 0000 0000 0000 0001 127.0.0.1 
0111 1111 0000 0000 0000 0000 0000 0011 127.0.0.3 
1000 0000 0010 0000 0010 0001 0000 0101 128.32.33.5 
1000 0000 0010 0000 0010 0001 0000 ' 0110 128.32.33.6 
1000 1100 1111 1100 0000 1101 0010 0000 140.252.13.32 
1000 1100 1111 1100 0000 1101 0010 0001 | 140.252.13.33 
1000 1100 1111 1100 0000 1101 0010 0010 140.252.13.34 
1000 1100 1111 1100 0000 1101 0010 0011 | 140.252.13.35 
1000 1100 1111 1100 0000 1101 0100 0001 | 140.252.13.65 
1110 0000 0000 0000 0000 0000 0000 0000 | 224.0.0.0 






0000 










224.0.0.1 


[18-6 [ 18-20 0 18-40 000000000 












































18 

















Radix 
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2. 
140.252.13.35 32] 1 
33[ 0 36[] 1 570 0 62[] 1 63[ 1 
140.252.13.35 
3. 
127.0.0.2 32[] 0 330 1 6310 
127.0.0.0 
(Oxff000000) 
4, 
10.1.2.3 320 0 331 0 “ end” [] " default” 
0.0.0.0 
( end) 
( ) 0x00000000 
(0) 
5. 
127.0.0.3 320 0 33[] 1 63[ I 
127.0.0.1 
63 
(Oxff000000) 127.0.0.0 
127.0.0.0 630 0 127.0.0.0 
6. 
112.0.0.1 320 0 330 1 63] 1 
127.0.0.1 
63 
(0xff000000) 
63[] 0 127.0.0.0 
(112.0.0.0) 
63 33 
( 32) 
(112.0.0.1) (0x00000000) 
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TCP/IP 2 
32] 0 33 0 “ end" [] “ default” 
0 
7. 
224.0.0.5 321] 1 331 35 0 63[] 1 
224.0.0.1 
63 Oxff000000 
224.0.0.0 
63[] 0 224.0.0.0 
N di ( 18-2) 224.0.0.5 
Destination Gateway Flags Refs Use Interface 
224.0.0.5 link# UHL 0 0 led 
18-7 35 18-4 
224.0.0.5 
8. 
18-8 
3-32 
224.0.0.0 224.0.0.1 
*rt_tables radix_node_head Oxff000000 
O0 18-7 DD 224.0.0.5[] 0000 
rt tables[AF INET] Internet O 18-60 00 
*radix node head radix node 
18-4 " bit 32" 
radix node 18-4 ( ) 
radix node 




































































































































































mask rnhead 





rn inithead 
















































































radix node head 


























18-4 
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° rtentry 18-8 rtentry 
rtentry radix_node 
rtentry 
rt_tables[]: radix node head() rtentry() : inpcb() 


op radix node() 
Y | (127.0.0.1) 
AF INET-2| J radix node() 
Reeg radix node() u) 
(left end) ' 
| radix node() 
(bit 32) 





inpcb() 










mask rnhead: radix node head() 
rtentry() 
radix node() 
(140.252.13.32) 
radix node() I inpcb() 
(bit 33) 






ifnet: le_softc[0]: sl_softc[0]: loif: 


a 
Q 
Q 
EJ 
É 
fth 
H 
= 
ke 
a 
Le) 
E 
får 
jas 
~ 
ks 





sockaddr_d1{} sockaddr dl() sockaddr dl() 





0188 00000000000 















































































































































rtentry 












































































































































ifnet ifaddr 
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TCP/IP [l-2 
rtentryl] | (U ) 
° UDP[] TCP (O 22-1) PCB( 22) 
rtentry [] route 0 IP UDP[] TCP] [|] g 0 
0 PCB[] route | ip output] |] 0 
PCB 
18.3 [JU U Ú 
4.3BSD Reno 
(routing socket) 4.3BSD Reno (U route ) 
ioctl 4.3BSD Reno PF ROUTE 
0 Il PF ROUTE UDE [] (raw socket)[] [] 
LU LU U U U (U U LU LU U U U ) 
18-9 12 rt msghdr[] [| (J 19-16) 
rtm type 5 (| ) | 0 12 
19 | 
rtm type OO000 D D DDD 0 [] U D 0 0 D 
RTM ADD . . Hogg rt-msghdr 
RTM CHANGE . . 0000000000 rt-msghdr 
RTM_DELADDR . 0000000 ifa-msghdr 
RIM_DELETE . ° Hogg rt-msghdr 
RTM GET . . n0pD00000000 rt-msghdr 
RTM_IFINFO . 0000000 rt-msghdr 
RTM_LOCK . . 00000 rt-msghdr 
RTM LOSING . 0000000 rt-msghdr 
RTM MISS . 0200000090 rt-msghdr 
RTM_NEWADDR . 0000000 ifa-msghdr 
RTM_REDIRECT . 00000000000 rt-msghdr 
RTM_RESOLVE . 0000000000000 rt-msghdr 
0189 J000000000000 
184 JO T 
0000 0000 coo 00000 18-10 
rn radix | | Patricia 
raw rout rt rt 
O O raw | 
(Touting control block) 32 
IP Net/3 
( OSI ) PF_ROUTE 


























































































































































































































China"pub.tom vo messo 457 


















































0 d 0 0 


net/radix.h radix[] [] 
net/raw cb.h 





net/route.h 





net/radix.c T (Patricia[] )[] O 
net/raw cb.c ul 
net/raw usrreq.c Ut 


net/route.c 




















° 

e: 

> 

DI 
Oooog/oo 














net/rtsock.c [] 


0 18-10 00000000 

















I arp, gated, route, N 
I routed, [] rwhod[][] ' 
| socket (PF_ROUTE, SOCK RAW, protocol) | 


EE 


sysctl 
0000 00000 O00000 f 000000 
























































































































































KE 
a 
PRU_SEND SK 
E 
8 
13 g 
Ë SE Së 
m +N 13) LS 
5 Ne Ë 
B MOS 3 
= EN = 
Ë 
1f up, if down 
000000 unun 
U D 0 D 
000000 tcp timers icmp input 
00000 DO TCPO O ICMP] 0 B U/ O TCPAPO O 
000000 000000 
DU D 0 0 DU DDD 0 
å rn_addroute rn_delete 
I 29 
= 
FR 


18-11 9000000000 
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O 18-10 00 LU U U U U U U U U U U U U U U U U U U U U U U U U U (U 0 U 
(U 12] ) 
rtalloc O Internet] Ú OOOOOOOOOOO LU U) U) U U 
ip_rtaddr|| ip_forwardll ip output[] ip setmoptions[ | |] Hl 
rtalloc in pcbconnect[] tcp. mss[] |] Lu L 
18-11 utl | 
* arp[] [] ARP Ug ARPU UL [| | Net I IP[] [| 0 0 d 21 ) 
* gated[] routed 0 E E 0 | 
( ID U 0 l U U ) | | 
e route[] Hu 
° rwhod[] uuilil sysctl | u u 
O U ¢ OD LU | | 
000000 18000000000 0000 
18.4.1 uut 
18-12 
O O pago O O 
rt_tables struct radix node head *[] 000000000990 
mask_rnhead struct radix node head * 0000000000 
rn mkfreelist | struct radix mask * NO radix mask] 000000 
max keylen int OO0O000000000000000 
rn zeros char * D D max Keven 000000000 
rn ones char * OOmax keylen D D D 100000 
maskedKey char * OO max keylen]JNHOOO0000 
rtstat struct rtstat NO DO O0 G 18-13) 
rttrash int OOO000000000 
rawcb struct rawcb 000000000090 
raw recvspace | u long OQ0000000000000 81920 0 
raw_sendspace | u_long O0O000000000000 819200 
route cb struct route cb O0000000000000000000000 
route dst struct sockaddr OOOO0000000000000 
route src struct sockaddr OOOO000000000000 
route proto struct sockproto p4400000000000 
O 18-12 Oda po gon a 00000000 
18.4.2 O00 
18-13 rtstat 
JOD | GOOD u LU U U SNMP[] ul 
18-14 netstatr H 000000 
























































































































































rtstat E 
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D D D U 

















rtstat[] U 0 [] [] SNMP 
rts badredirect 0000000000 
rts dynamic 00000000000 
rts_newgateway O0000000000 
rts unreach 000000 
rts wildcard O0000000000G000> 
0 18-13. [ rtstat [00O00000000000 








1 
0 


0 
0 
0 





netstat-rs[] 00 


029 bad routing redirects 


dynamically created routes 


new gateways due to redirectsrts_newgateway 


destinations found unreachablets_unreach 


uses of a wildcard route 








rtstat [| 


rts_badredirect 


rts_dynamic 


rts-wildcard 








18.43 SNMPI I 





D 18-14 pDg00000000 









































































































































































































































D 18-150 0 D DD iprouterable[ ID D 000 0000 0 0 
IP] O O O index = <ipRouteDest> 
SNMPI [] 0 0 0 0 
ipRouteDest rt_key PIO0OOOO0Q0.0.0.00OOOO0000 
ipRouteIfIndex rt ifp[]if index O00 0 ifIndex 
ipRouteMetricl | -1 DDOODDDUDDDUUDDDDDULD GpRoute- 
Proto] 00-10000000 
ipRouteMetric2 = OOOOOOO 
ipRouteMetric3 = U D D 000 
ipRouteMetric4 _ 000000 
ipRouteNextHop rt_gateway 000000010 O 
ipRouteType (DDD ) D D 00 D 1-000 200000 30000400 
U 
ipRouteProto 000) 0000901200 O 4=10MP[ O 0 [| 8=RIP, 13=0SPF] 
14= BGP[] 
ipRouteAge qun» uggapngagagaaggagneaducntlt 
ipRouteMask rt mask O D ipRoutedest] D BL D D 0 0 OOOO 
DU DD DDD 0 
ipRouteMetric5 =] U D D 000 
ipRouteInfo NULL 00000000 MIB d DUN 
O 18-15 PO [| [ [| ipRouteTable 
U ODO rt_flags] 000 RTF_GATEWAY 000000000000 ipRouteType 
U U TD 000000000000 iprouterypell [] 3] 0 0 iprouterroto] 00000 
RTF DYNAMIC[] RTF MODIFIED[][I LI Í ] [] ICMP| | | 4000 
U DU D UD 0 0 00 0 10 000 00 cr mask 0 0 UD UD D D 0 0 D DD 0 0 10 D 0 D D DU 
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18.5 Radix] 0 [] 000 








18-8 











radix_node_head 






















































































































































































( 
































18-16 












































radix_node_head 





























) radix_node 














radix.h 


91 struct radix_node_head { 









































































































































































































































































































































92 struct radix_node *rnh_treetop; 
93 int rnh_addrsize; /* (not currently used) */ 
94 int rnh_pktsize; /* (not currently used) */ 
95 struct radix node *(*rnh addaddr) /* add based on sockaddr */ 
96 (void *v, void *mask, 
97 struct radix node head * head, struct radix node nodes[]); 
98 struct radix node *(*rnh addpkt) /* add based on packet hdr */ 
99 (void *v, void *mask, 
100 struct radix node head * head, struct radix node nodes[]); 
101 struct radix node *(*rnh deladdr) /* remove based on sockaddr */ 
102 (void *v, void *mask, struct radix node, head * head); 
103 struct radix node *(*rnh delpkt) /* remove based on packet hdr */ 
104 (void *v, void *mask, struct radix node head * head); 
105 struct radix node *(*rnh matchaddr) /* locate based on sockaddr */ 
106 (void *v, struct radix node head * head); 
107 struct radix node *(*rnh matchpkt) /* locate based on packet hdr */ 
108 (void *v, struct radix node head * head); 
109 int (*rnh walktree) /* traverse tree */ 
110 (struct radix node head * head, int (*£) (0), void *w); 
111 struct radix node rnh_nodes[3]; /* top and end nodes */ 
112 3; i : 
radix.h 
U 18-16 radix node head 000000000090 
92 rnh_treetop radiz node radix node heBd 
radix node ([] 18-8) 
93-94 rnh addrsizel| rnh pktsize 
rnh addrsize 
rnh pktsize radix 




























































































































































































































































































































































































































































































































































































































































































95-110 rnh addaddr|| rnh walktree 
18-17 rn inithead 
Net/3 R 0 O rn initnead] OOO 

111-112 18-18 rnh_addaddr rn_addroute 
radix_node 18-8 rnh_addpkt NULL 

radix node head rnh_deladdr rn_delete 

N rnh_delpkt NULL 

radix_node Feentry rnh_matchaddr rn_match 
radix_node rnh_matchpkt NULL 

41-45 rnh_walktree rn_walktree 







































































union 
































































































































U 18-17 [] radix node head 0000 
000000 
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Net/3 union 
#define 
41-42 rn_mklist 18.9 rn_p 
43 rn_b 
rn_b 18-4 rn_b 32 
rn_b - 1 (index of the network mask) 
18-19 18-4 
A radix.h 
40 struct radix_node { 
41 struct radix_mask *rn_mklist; /* list of masks contained in subtree */ 
42 struct radix_node *rn_p; /* parent pointer */ 
43 short rn b; /* bit offset; -l-index(netmask) */ 
44 char rn_bmask; /* node: mask for bit test */ 
45 u_char rn_flags; /* Figure 18.20 */ 
46 union { 
47 struct { /* leaf only data: rn b < 0 */ 
48 caddr_t rn, Key; /* object of search */ 
49 caddr t rn Mask; /* netmask, if present */ 
50 struct radix node *rn, Dupedkey; 
51 ) rn leaf; 
52 struct ( /* node only data: rn b »- 0 */ 
53 int rn Off; /* where to start compare */ 
54 struct radix node *rn L; /* left pointer */ 
55 struct radix node *rn R; /* right pointer */ 
56 ) rn node; 
57 ) rn_u; 
58 ); 
59 #define rn dupedkey rn u.rn leaf.rn, Dupedkey 
60 #define rn, key rn u.rn leaf.rn Key 
61 #define rn mask rn u.rn leaf.rn Mask 
62 #define rn off rn u.rn node.rn Off 
63 #define rn 1 rn u.rn node.rn L 
64 #define rn r rn,u.rn node.rn R . 
radix.h 
O 18-18 radix node 000000000 
32 bit PO O (0 O 32- 36 - 
4444 4444 4455 5555 
0123 4567 8901 2345 
00000000: i 0000 0000 0000 0000 
££000000: 0000 0000 0000 0000 
ffffffe0: 1111 1111 1111 1111 
018-19 [000000 
0 0 32 
44 rn bmask 0 1 
0 rn bmask rn off 
45 18-20 rn_flags 
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RNF ACTIVE | [BLOOD HB H (alive)(Q O rtfree) 
RNF NORMAL | I00000000 000000) 
RNF ROOT O00000000 
O 18-20 rn flags [| U 
RNF ROOT radix node head radix ( 
) 
48-49 rn key rn mask 
rn mask 1[] ( 
) 
18-21 18-4 140.252.13.32 radix_node 
0000 63000 radix nodet) 

















radix node() 

































140. 

62] 9 [c] 
rn dupedkey 

255. 

radix mask() 


sockaddr in() 


252. 13 . 32 


[fe oao 0 |] 


255.255.224 


aa 0 | 

























































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































D 18-21 OG 18-40 0 0 D 140.252.13.320  O O0 radix node [0 
18-22 radix mask 
radix node radix mask 
18.9 | 
- 60] rn b 59[] rn key sockaddr in 
16 2(AF INET) rn mask[] rm mask 8 
0( AF_UNSPEC ) 
50-51 rn_dupedkey 18.9 
52-58 rn_off 18.8 rn l[]rn r 
18-22 radix mask 
76-83 rm mask 
radix node radix mask 
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rn_mklist 






































mklist rn_mkfreelist 


















































































































































radix_mask 




























































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































— radix.h 
76 extern struct radix_mask ( 
77 short rm_b; /* bit offset; -l-index(netmask) */ 
78 char rm unused; /* cf. rn bmask */ 
79 u char rm flags; /* cf. rn flags */ 
80 struct radix mask *rm mklist; /* more masks to try */ 
81 caddr t rm mask; /* the mask */ 
82 int rm refs; /* # of references to this struct */ 
83 ) *rn mkfreelist; . 
radix.h 
O 18-22 radix mask DI 
18.6 [I UL 
1) rtalloc 
2) route rtalloc 
3) route rtentry 
18-8 UDP[] TCP( 22[] ) (PCB) route 
18-23 
route.h 
46 struct route { 
47 struct rtentry *ro rt; /* pointer to struct with information */ 
48 struct sockaddr ro, dst; /* destination of this route */ 
49 ); 
route.h 
O 18-23 route O JJ 
ro dst Internet 
Sockaddr in ro dst 
8-24 IP 
. route 
route 0( PO eE )J UDP[] TCP PCB 
route ip_output 
. route rtentry (ro_rt ) 
route IP 
IP so_dst 
rtalloc TCP 
UDP sendto 
° rtalloc ro_rt ip_output 
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(U 18- 











































































































| rt_gatewayl] 







































































































































































83 struct rtentry { 


84 struct radix node rt nodes[2]; 
85 Struct sockaddr *rt gateway; 
86 short rt flags; /* 
87 short rt_refent; za 
88 u long rt use; /* 
89 struct ifnet *rt ifp; PE 
90 struct ifaddr *rt ifa; /* 
91 struct sockaddr *rt genmask; 
92 caddr t rt llinfo; pe 
93 struct rt_metrics rt_rmx; /* 
94 struct rtentry *rt gwroute; /* 
95 1; 


96 #define rt key (r) 
97 #define rt mask(r) 

















TCP/IP [1.2 
u rtentry RTF_GATEWAY 
200 60 0) 0 | OU (dst) IP! 
0 IP] U 0 | 
18-24 rtentry | 


route.h 
/* a leaf and an internal node */ 


/* value associated with rn_key */ 

Figure 18.25 */ 

#held references */ 

raw #packets sent */ 
interface to use */ 
interface address to use */ 

/* for generation of cloned routes */ 
pointer to link level info cache */ 
metrics: Figure 18.26 */ 
implied entry for gatewayed routes */ 


((struct sockaddr *) ((r)->rt nodes-»rn key)) 
((struct sockaddr *)((r)-»rt nodes-»rn mask)) 










































































































































































































































































































































































































































































































































































































































































route.h 
U 18-24 rtentry D U 
83-84 radix_node 18-7 
rt nodes[0] 
rt nodes[l] 18-24[] | #define 
86 18-25 rt_flags O 18-20“ Flags” 0090 
netstat 
[] [] net stat Ü [] [] 

RTF BLACKHOLE O0OOOOOO0 0000 0 :D 5-27) 

RTF CLONING C OOOOOOOOO (0 ARPO D ) 

RTF DONE d DU D D D 00 DDD 00 DD 0 

RTF DYNAMIC D (DU 0 DD 0000 

RTF GATEWAY G D D DDD DD DD (00000) 

RTF HOST H po (00000000 7 

RTF_LLINFO L [ rt 11info] 000000 ARPOO 

RTF_MASK m 48000 (000) 

RTF_MODIFIED M (0000) 0090 

RTF_PROTO1 1 0200000000 

RTF PROTO2 2 OOOOOOOOO«ArRPOD) 

RTF REJECT R OOOOOOOO (00000 :D 5-27) 

RIF_STATIC s 0000000 (route D) 

RTF_UP U D 0 D 

RTF XRESOLVE x D DD DDD Doo 0 x25 

H 18-25 rt. flags [] D 
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netstat RTF_BLACKHOLE RTF_DONE 
RTF_MASK 
85 RTF_GATEWAY rt_gateway 
( IP ) rt_gwroute rtentry 
ether output([] 4-15) 
87 rt refcnt 19.3 
18-2 " Refs" 
88 rt use 0 8-24 
IP 18-2[] " Use" 
89-90 rt ifp[]rt ifa 6-5 
rt ifa 
92 rt llinfo 
RTF LLINFO 21-1 ARP 
- route.h 
54 struct rt metrics { 
55 u long rmx locks; /* bitmask for values kernel leaves alone */ 
56 u long rmx mtu; /* MTU for this path */ 
57 u long rmx hopcount; /* max hops expected */ 
58 u long rmx expire; /* lifetime for route, e.g. redirect */ 
59 u long rmx recvpipe; /* inbound delay-bandwith product */ 
60 u long rmx, sendpipe; /* outbound delay-bandwith product */ 
61 u long rmx ssthresh; /* outbound gateway buffer limit */ 
62 u long rmx rtt; /* estimated round trip time */ 
63 u long rmx rttvar; /* estimated RTT variance */ 
64 u long rmx pksent; /* #packets sent using this route */- 
65 ); 
route.h 
[] 18-26 rt metrics U U 
93 18-26 rt metrics rtentry 27-3 TCP 
54-65 rmx locks 
20-13 
ARP( 21[] ms expire ARP rmx expire 
rm expire 
18-28 
rtentry 18-2 128.32.33.5 rtentry 
radix node 18-4 36 
ifaddr Sockaddr dl 3-38 6-5 ifnet 
le softc ifaddr in ifaddr 
18.7 JO U route init[] rtable_init[] |] 
7 domain 








































































































































































































18-27 















































domain 
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OSI[] Internet[] H H 


































dom family AF ISO AF_INET 
dom_init 
dom_rtattach 


PF_ROUTE 
route init 


AF UNIX | AF NS 
0 
rn inithead 

























































































































































































































































































































































































































































































































































































































































































































































dom rtoffset | 48 32 0 16 
dom_maxrtkey | 32 16 0 16 
0 18-27 domain JI00000000000 
PF route 
dom rtattach rn inithead Unix 
rtentry() inpcbt} 
rn_mklist 
ER rn_p 128.32.33.5 
š rn_b -1 162] 0 [so[20/21[05 0 
8 rn_bmask 0 140.252. 13.33 
N rn_flags 162] O j|8c|fc|0d|21 0 ro_rt: = 
C rn key 16 | 2 0 4 
A rn mask O D seckaddr int) 08 | 20 | 21 | 05 å 
rn dupedkey 0 $ 
rn mklist ifnet{} 0 E 
rn_p if name le\0 a 
z rn_b 36 if_next to SLIP ifnet() 
3 rn_bmask 0x08 if addrlist a 
v rn_flags 
3 rn off 4 
8 1 
rn 1 
0 
rn_r 
rt_gateway 
rt flags UGHS 
rt_refent 2 
rt_use 16 
rt_ifp = i D D DD 
rt ifa ifaddr() | 
rt_genmask ifa, addr 20118! 1 118)3/6/0/1/|e|0108/00|20j;031£6/42 0 
rt_llinfo ifa_dstaddr 
rmx_locks ifa_netmask 110 O [0jojojoOjrejre ¡repo jojojo ¡ojo 0 
rmx_mtu ifa_ifp 
" rmx hopcount ifa next DD sockaddr d1() 
= rmx expire ifa rtrequest 
A rmx_recvpipe ifa_flags 
3 rmx_sendpipe ifa refcnt 
p rmx ssthresh | ifa metric 
i rmx rtt ifaddr{} 140.252. 13 . 33 
rmx_rttvar ifa_addr 1612| 0 j|8c|£c|oa|21 0 
rmx pksent ifa, brdaddr 140.252. 13.63 
rt. gwroute ifa netmask 1612) O |8c|fc|oaj3£ 0 
ifa ifp 255.255.255.224 
nn ifa next 1612] 0 Teeles[er[eo 0 
ifa rtrequest 
ifa flags U H H U soekaddr int) 


ifa refcnt 


ifa metric 


01828 [00000 


route() 
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dom_rtoffset ( 
JU dom maxrtkey 
Sockaddr in IP 32 
dom maxrtkey sockaddr in 16 
18-29 

main() /* kernel initialization */ 
t 

ifinit(); 

omaininit(); 
omaininit () /* Figure 7.15 */ 


{ 


ADDDOMAIN (unix) ; 
ADDDOMAIN (route) ; 
ADDDOMAIN (inet); 
ADDDOMAIN (osi); 


for ( dp = alldomains ) { 

(*dp-»dom init)(); 

for ( pr - allprotocols for this domain ) 
(*pr-»pr init) (); 







faw init() 


/* pr init() function for SOCK RAW/PF ROUTE protocol */ 
{ 


0000000000000 
} 


route init() /* dom init() function for PF ROUTE domain */ 
{ 
rn init(); 
—-rtable init(); 
} 


rn init() 
{ 
for ( dp = alldomains ) 
if (dp->dom_maxrtkey > max_keylen) 
max_keylen = dp->dom_maxrtkey; 
000000 rn-zeros,rn ones,masked key; 





rn inithead(&mask rnhead); /* allocate and init tree for masks */ 
} 
rtable init() 
t 

for ( dp - alldomains ) 

(*dp->dom rtattach) (&rt tables[dp-»dom familyl); 

} 
rn inithead() /* dom attach() function for all protocol families */ 
L 


00000000 radix node head [][] ; 


01829 000000000000 


























































































































main domaininit ADDDOMAIN 
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domain dom_init ( ) 
18-27 route_init dom_init 18-30 
e route.c 
49 void 
50 route _ init () 
51 ( 
52 rn init(); /* initialize all zeros, all ones, mask table */ 
53 rtable init((void **) rt tables); 
54) 
route.c 
O 18-30 rout init [] D 
18-32 rn_init 
18-31 rtable_init dom_ 
rtattach 
- route.c 
39 void 
40 rtable_init (table) 
41 void **table; 
421 
43 struct domain “dom; 
44 for (dom = domains; dom; dom = dom->dom_next) 
45 if (dom->dom_rtattach) å 
46 dom->dom rtattach(&table[dom-»dom family], 
47 i dom->dom rtoffset); 
483 
route.c 
[] 18-31 rtable init [J TH J DH J dom rtattach [0 
18-27 rn_inithead dom_rtattach rn 
inithead 
18.8 0000 rn init[] rn inithead[] |] 
18-32 rn_init route_init radix 
1. max_keylen 
750-761 domain max_keylen 
dom_maxrtkey 18-27 32( AF_ISO) 
OSI[] XNS max_keyl] 16 sockaddr_in 
2: rn zeros[| rn ones[| maskedKey 
762-769 max keylen rn zeros 
R Malloc malloc M RTABLE 
M DONTWAIT Bcmp|| Bcopy|] Bzero|| Free 
| 
18-33 
rn zeros 0 rn ones 1 maskedKey 
































































































































































































































China-pubutom so manono 469 















































radix.c 
750 void 
751 rn_init() 
752 1 
753 char *cp, *cplim; 
754 struct domain *dom; 
755 for (dom = domains; dom; dom = dom->dom_next) 
756 if (dom->dom_maxrtkey > max_keylen) 
757 max_keylen = dom->dom_maxrtkey; 
758 if (max_keylen == 0) { 
759 printf("rn_init: radix functions require max_keylen be set\n"); 
760 return; ` 
761 } 
762 R Mallocí(rn zeros, char +, 3 * max_keylen); 
763 if (rn zeros == NULL) 
764 panic("rn init"); 
765 Bzero(rn zeros, 3 * max kelen): 
766 rn ones = cp = rn zeros + max keylen; 
767 maskedKey - cplim - rn ones 4 max keylen; 
768 while (cp « cplim) 
769 *op++ = -1; 
770 if (rn_inithead( (void **) &mask rnhead, 0) == 0) 
771 panic("rn_init 2"); 
772 3 


A ——— ee paix 


O 18-32 rn init JQ 


max Kev len U 0 0 max keylen 000 max_keylen U D 0 | 


000 ... 0001 1 1 ... 111000 sås 000 


rn_zeros rn_ones maskedKey 


O 18-33 rn zeros [| rn ones [| maskedKey [ JJ 















































































































































































































































































































































































































































































































































































































































































































































































































































































































































3. 
770-772 rn_inithead 18-8 
mask_rnhead radix_node_head 
18-27 rn_inithead dom_attach 
18-34 Internet 
radix_node_head 
radix_node (U rnh_treetop 
) 
(rn_p) 
rnh nodes[l].rn b 32 Internet|] domain 
dom rtoffset (U 18-27) 
















































































































































































































































































































































































radix node rn off ( 4) 


rn bmask ( 0x80) radix node 

























































































































































































470 




















China=pub.com 

























































































































































































































































































































































































































































































TCP/IP 2 
18-4 33 
4[] 0x40 63 
70) 0x01 
rn_b - 33 - 1 
rt_tables[]: radix_node_head{} 
deeg 












































0 

0 

rn_addroute 

NULL 

rn_delroute 
rnh_delpkt NULL 

rn match 

NULL 

rn walktree 

rnomklist  |NULL 

rn p 










rn b 733 dix nodet) 
radix node 

rn bmask 0 rnh_nodes[0] 

[m-flas — jacmweisoor =f Ton ang 

rn zeros 

rn mask NULL 


rn dupedkey NULL 

rn mklist ` |NULL — 

rn p 

rn b 

rn bmask 

rn off 

rn p 

rn bmask 0 en d 
rnh_nodes 

| rn flags |ACTIVE|ROOT 000000 

zn ones 


rn mask 
rn_dupedkey 


32 radix_node{} 
0x80 rnh_nodes [1] 
ACTIVE | ROOT U U H 

4 000000 










-33 































































































































































































































































































































































































































O 18-34 rn inithead [] Internet O [| [| O radix node head 00 
O(rn zeros) l(rn ones) 
RNF ROOT ( RNF_) 
(NFS) 
(mount point) radix_node_head 
( ) rt_tables 

































































































































































































































































































































































China-pubıtoM w messo 471 















































18.9 [(]D Dn D D D D DI 








































































































































































































































































































































































































































































































































































































radix node 
rn dupedkey radix node 
rn mklist radix mask 
18-4 “end” [| " default" 
RNF ROOT ( 18-34 rnh nodes[0]) 0 
255.255.255.255 ( 
) ( 1 ) 
Net/3 radix 






































































































































































































































18-35 0 rn flags 
RNF | 































































































































































































































































































radix node() 


rn bmask 


rn off 


radix node() 


rn_p 
rn_flags 


rn_dupedkey 













MA 00000000 


0x80 
18-40 00 0 3200 
ACTIVE | ROOT 000 


4 















00330 0 
0000 









=33 
0 
ACTIVE | ROOT 















rn_zeros: 










radix_node{} 













0.0.0.0 
5672] o Joofoojoofoop — — 3. 7 
[rn dupedkey — NULL sockadår in 









radix_maskt} 














01835 9000000000 



































MÍ en China"pub.tom 
AA re 




















































































































































































































































































































































































































































































































































































































































































































































































































































































































—— |] 18-4 32 
( rn_b ) rn_dupedkey 
18-34 rnh nodes[0] " end" — 
RNF ROOT rn inithead rn zeros 
rn key 0.0.0.0[] sockaddr in 
0 rn mask 
rn_zeros 
" end" 
rn key ( RNF ROOT ) rn inithead([] 18-34) 
end rn zeros " end" 


































































































rn ones 


























radix mask 



































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































18-4 
127.0.0.1 127.0.0.0 A 
Oxff000000 A 24 bit 16 bit 8 bit 
127.0.0 Oxffffff00 
bsdi $ route add 127.0.0.0 -netmask Oxffffff00 140 252 13 33 
127 
Internet ( ) 
0 off 
127 
127.0.0.1 
Oxffffff00 
(Oxffffffff) 1 7000 0x££000000 
127.0.0.2 0x00000000 
Oxffffff00 0 
Oxff0000 127.0.2.3 
0x££000000 were 
18-36 0x££000000 
18-4 33 0 18-36 00 000 1270000000 
127.0.0.0 
18-37 radix_nod|| radix mask 
radix node[| radix mask ( 63) 
Oxffffff00 Oxff000000 
radix node(rn b - 57 ) 
radix node Oxff000000 
















































































































































































China-pubıtoM menn 473 












































radix nodet) 
















rn b 63 

rn bmask 0x01 

[mm fiags  jacrrve f DDS DDD 

rn off 7 

radix node() radix node() for 127.0.0.1 

-57 
0 : gockaddr in 
| rn flags |ACTIVE j 127.0.0.0 
Hé[z[ 9 Trefoofoofoop — — 9 — 






radix node() 






(opp Fd Ep, — — 3 








sockaddr in 
127. 0.0.0 


[162] 0 jvrjoo[oonoo] 0 ll 












[5[ojojojrrjojooo] 0 | 






radix_mask{} 
rm_off 
rm_unused 
rm flags 

rm mklist 
rm mask 

rm refs 0 





radix mask() 

rm off -41 
rm, unused 
rm, flags 
rm mklist NULL 
rm, mask 

rm refs 0 


0 18-37 OO 127.0.0.00 00000000000 







































































































































































































































































( 






























































































































































C Oxffffff00) 















































18.10 rn match[] |] 
















































































rn match Internet rnh matchaddr 
















































































474 












































































































































China-pubecom 


































































































































































































































































































































































































































































































TCP/IP 2 
rtallocl (J rtallocl rtalloc 

) 

1) 

(O 18-38) 

2) 

3) ([] 18-43) 

18-38 rn match 
radix.c 


135 struct radix node * 
136 rn match(v arg, head) 


137 void *v arg; 

138 struct radix node head *head; 

139 ( 

140 caddr t v - v arg; 

141 struct radix node *t - head-»rnh treetop, *x; 

142 caddr t cp - v, cp2, cp3; 

143 caddr t cplim, mstart; 

144 struct radix node *saved t, *top - t; 

145 int off - t-»rn off, vlen - *(u char *) cp, matched off; 
146 /* 

147 * Open code rn search(v, top) to avoid overhead of extra 
148 * subroutine call. 

149 */ 

150 for (; t-»xn b >= 0;) { 

151 if (t-»rn bmask & cp[t-»rn off]) 

152 t - t-»rn r; /* right if bit on */ 
153 else 

154 t = t-»rn 1; /* left if bit off */ 
155 } 

156 qe 

157 * See if we match exactly as a host destination 
158 */ 

159 Cp += off; 

160 cp2 = t->rn_key + off; 

161 cplim = v + vlen; 

162 for (; cp < cplim; cp++, cp2++) 

163 if (*cp != *cp2) 

164 goto onl; 

165 /* 

166 * This extra grot is in case we are explicitly asked 
167 * to look up the default. Ugh! 

168 Ef 

169 if ((t->rn flags & RNF ROOT) && t->rn_dupedkey) 
170 t = t->rn_dupedkey; 

171 return t; ¿ 

172 onl: 


Te die 


0 18-38 mmatch [000000000000000000000 






























































































































































































































































135-145 v_arg head 
radix_node_head ([ 18-17) 
head 
off rn off (L] Internet 4 18-34) 





































































































































































































































































































18 








Radix 



















































































475 























































































































































































































































































































































































































































































































































































































rn of 








vlen ([] Internet 16) 
1. 
146-155 
(rn_b 0) rn_bmask 
rn_off Internet rn off[] 40 5U 6 7 
2. 
156-164 
18-39 Internet 



























































































































































vlen=16 
off=4 
1 
me Bl | mi L «> 
D I byte 8 


0200000000 































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































WA 
D 18-39 [] D sockaddrin 0000000 
onl 
sockaddr_in 8 0 (proxy 
ARP)(21.12] ) IP 
IP ( 8 0) IP 
(U U S ) 
18-39 vlen rtallocl 
family port 
3. 
165-172 18-35 0 
RNF_ROOT RNF_ROOT 
rn_dupedkey ( 18-35 ) 
“ end” ( 0 ) 
“ end” ( 1 ) t RNF ROOT 
rtallocl 
rn match 
18-40 
173-174 cp matched_off 
175-183 do while 
18-4 IP 
140.252.13.60 140.252.13.32( 62[] 63 0) 
18-41 18-40 for 



































































































































































































































































































































476 





China-bubcom 












































TCP/IP 2 
radix.c 
173 matched_off = cp - v; 
174 saved_t = t; 
175 do { 
176 if (t->rn_mask) { 
177 Zë 
178 * Even if we don't match exactly as a host; 
179 * we may match if the leaf we wound up at is 
180 * a route to a net. 
181 Wi 
182 cp3 = matched off + t->rn mask; 
183 cp2 = matched off + t->rn key; 
184 for (; cp < cplim; cp++) 
185 if ((*cp2++ ^ *cp) & *cp3++) 
186 break; 
187 if (cp == cplim) 
188 return t; 
189 cp = matched off + v; 
190 } 
191 } while (t = t->rn_dupedkey); 
192 t = saved t; 
radix.c 
0 18-40 zn match [] [] 0000000000000 
140.252. 13. 
search key: 


radix node () 





4 < ! cplim 


cp 


cp2 


140.252. 13 | 32 


[&e[fe]va[29] — — 3 — — —-] 
| 


rn dupedkey 





255 . 255 . 255 . 224 


143 323 Cl —— —9 


cp3 


01841 DD Da D UD 













































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































sockaddr in 
max keylen 0 
184-190 
( 18.1) 
IP 18-42 IP 
140.252.13.188 570 62[] 63 
0 18-41 
(140.252.13.60) UL 
0) 


Chi HIT 180 Radix 






































477 









































000 = 140.252.13.60 | 0 00 = 140.252.13.188 
00000 ep: 0011 1100 = 3c 1011 1100 = 
000000 (*cp2): 0010 0000 = 20 0010 0000 = 20 
OG: 0001 1100 1001 1100 
D (11 H 0] (*cp3): 1110 0000 = eo 1110 0000 = eO 
Bun: 0000 0000 1000 0000 
0 18-42 000000000000000 





































































































































































































































































































































































































191 
rn match 18-43 
radix.c 
193 /* start searching up the tree */ 
194 do { 
195 struct radix mask *m; 
196 ` t = t->rn_p; 
197 if (m = t->rn_mklist) ( 
198 /* ; 
199 * After doing measurements here, it may 
200 * turn out to be faster to open code 
201 * rn_search_m here instead of always 
202 * copying and masking. 
203 */ 
204 off = min(t->rn off, matched off); 
205 mstart = maskedKey + off; 
206 do { 
207 cp2 = mstart; 
208 cp3 = m->rm mask + off; 
209 for (cp = v + off; cp < cplim;) 
210 *cp2++ = *cp++ & *cp3++; 
211 x =.rn search(maskedKey, t); 
212 while (x && x-»rn mask !- m-»rm mask) 
213 x = x-»rn dupedkey; 
214 if (x && 
215. (Bemp(mstart, x-»rn key + off, 
216 vlen - off) == 0)) 
217 return x; 
218 } while (m = m->rm_mklist); 
219 } 
220 } while (t != top); 
221 return 0; 
222 }; 
radix.c 


193-195 do while 





0 18-43 mm match D 0000000 U 




















































































































196 


















































































































































































































































197-21 


0 


rn_mklist 






































































































































radix_node 





























































































































































































































































































































radix_mask 





















































radix_node 























do while 
























































478 reran 0° Lmzchuktnh 
emnet am] 
























































140.252.13.188 18-44 for 

































































































































































































































































































































































askedKey Oxffffffe0 |[] 18-4 

















m 


140.252.13.32 62 











































































































140.252. 13 . 188 = $ 
matched_off = h ! 
T cplim 


cp 

















DUU 


radix nodef) 


radix_mask{} 






62 
2 
RNF_ACTIVE 

























maskedkey:| 


mstart 
cp2 


0 18-44 )00000000000000000 



































rn search( 18-48 ) 



















































































































































































































































































































































































































































































































































































































































































for 
U maskedKey t 18-45 | 
maskedKey[] 
maskedKey: b u 
— off=7 > 
mstart 
[] 18-45 0 [ zn search [] U maskedKey 
Oxa0[] Oxbc(188 JN 0xeo( ) 
211 rn search 
LU U U U U l U U 90 [] 18-45 
18-4 140.252.13.32 0xa0 62[] 63 0 18-46 






































































































































Bcmp 
















































































































































































Chinaspubitom so mann 479 



























































| vlen - off =9 








mstart 


U 18-46 maskedkey [I 00000000 


140 . 252. 13 . 188 








radix_node{} V 





ACTIVE | ROOT 
4 





off =4 vlen - off = 12 | 


mstart 






rn p 
rn b 
rn bmask 


radix node() 


rn, 
rmn, 


LD 
L.D 






0 
ACTIVE | ROOT 







NULL 














mp — 
mb dE 


rn dupedkey 








0 18-47 OOO000000000000000 msearch 


480 


























China-bubcom 











































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































TCP/IP 2 
212-221 while 
rn_mask m->rm_mask 18-36 18-37 
63 do while m radix_mask 
OxffffffO0O0[] rn search 127.0.0.0 
rm mask m-»rm mask Bcmp m 
radix mask ( Oxff000000) do 
while rn search 127.0.0.0 
rn mask m->rm_mask|| While rn mask||m- 
>rm mask 
140.252.13.188 62 
rn mklist 
18-47 maskedKey( 0) 
rn search ( ) 18-4 
" default" 
rn search x rn_b - 330 radix node 
x->rn_mask( )[] m->rm mask 
x->rn dupedkey x while x-rn_mask 
m->rm_mask while Bcmp mstart 12 0 
x->rn_keyl] 4 12 0 x 
18.11 rn search[|[] 
rn match rn search 
18-48 
radix.c 
79 struct radix_node * 
80 rn search(v arg, head) 
81 void *v arg; 
82 struct radix node *head; 
83 ( 
84 Struct radix node *x; 
85 caddr t v; 
86 for (x - head, v - v arg; x-»rn b »- 0;) ( 
87 if (x-»rn bmask & v[x-»rn offl) 
88 X - X-»rn r; /* right if bit on */ 
89 else 
90 x = x-»rn 1; /* left if bit off */ 
91 } 
92 return (x); 
93 ); ; 
radix.c 


[] 18-48 rn search DI 











18-38 





























































































































































































































18 











Radix 























481 











































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































0 1 
18.12 Of 
IP IP IP 
| 
IP 
Internet route route 
UDP[] TCP IP Internet 
Internet routell UU 
Patricia OD | 
Patricia Patricia 
[Sklower 1991] radix 
Net/1 radix Net/1 
OD 
18.1 18-3 
18-40 
18.2 Net/3 20 000 (IP ) 











































































































































































































































































































18.3 radix node 
























































0190 000000060 


























































































































































































































































































































































































































































































































































































































































































































































































































19.1 OO 
rtalloc|| rtallocl rtrequest 
rtinit 
(|| route ) (routed[] gated) 
sysctl 





























































































































































































































































































































19.2 rtalloc[|] rtalloci|] |] 










































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































rtalloc[|rtalloc1l 19-1 

rtalloc 

58 void route.c 

59 rtalloc(ro) 

60 struct route *ro; 

61 I 

62 if (ro->ro_rt && ro->ro rt->rt ifp && (ro->ro rt->rt flags & RTF UP)) 

63 return; /* XXX */ 

64 > ro-»ro rt = rtallocl(&ro->ro dst, 1); 

65 } 

route.c 
[] 19-1 rtalloc 0 0 
58-65 ro TCP[] UDP Internet PCB([] 220 ) route 
FO rtentry (U ro rt ) 
rtallocl 1 
19-2 rtallocl rnh_matchaddr Internet 
rn match[]([] 18-17) 

66-76 sa family 

1 rn match 
77-78 

1) 

2) rn match 
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3) radix_node RNF_ROOT 
end RNF_ROOT 
route.c 
66 struct rtentry * 
67 rtallocl(dst, report) 
68 struct sockaddr *dst; 
69 int report; 
70 ( 
71 struct radix node head *rnh = rt tables[dst->sa family]; 
72 struct rtentry *rt; 
73 struct radix node *rn; 
74 struct rtentry *newrt = 0; 
75 struct rt_addrinfo info; 
76 int s = splnet(), err = 0, msgtype = RTM MISS; 
77 if (rnh && (rn = rnh->rnh matchaddr((caddr t) dst, rnh)) Së 
78 ((rn->rn flags € RNF ROOT) == 0)) ( 
79 newrt - rt - (struct rtentry *) rn; 
80 if (report && (rt-»rt flags & RTF CLONING)) ( 
81 err - rtrequest(RTM RESOLVE, dst, SA(0), 
82 SA(0), 0, &newrt); 
83 if (err) ( 
84 newrt - rt; 
85 rt->rt_refcnt++; 
86 goto miss; 
87 } 
88 if ((rt = newrt) && (rt->rt flags & RTF_XRESOLVE)) { 
89 msgtype = RTM_RESOLVE; 
90 goto miss; 
91 } 
92 } else 
93 rt->rt_refent++; 
94 } else { 
95 rtstat.rts_unreach++; 
96 miss:if (report) { 
97. bzero((caddr t) & info, sizeof(info)); 
98 info.rti_info[RTAX_DST] = dst; 
99 rt_missmsg (msgtype, &info, 0, err); 
100 } 
101 1 
102 splx(s); 
103 return (newrt); 
104 } 
route.c 
[] 19-2 rtalloc1 [| [| 
2. 
94-101 
rts unreach rtallcol (report)[]! 
RTM MISS 
79 radix node EE 
newrt rtentry ([] 18-24) radix_node 
18-8 rn_match radix_node 
rtentry rtentry 















































































































































































































































484 iu: China=pubecom 
OF ran pang Tan 












































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































3. 
80-82 RTF CLONING 
rtrequest RTM RESOLVE rtentry 
ARP 
4. 
83-87 rtrequest newrt rn match 
miss RTM MISS 
5. 
88-91 rtrequest RTF XRESOLVE 
miss RTM RESOLVE 
IP x.121 
6. 
92-93 RTF CLONING 
rtallocl 7 
19-3 































































































































































































































































































































































































5 6 rt_refcnt rtrequest 
























































RTM_RESOLVE rtrequest 



























































19.3 [| RTFREE[] rtfree[| |] 




















































































































































































































































































































































































































































































































































































































































































































































































































































































































RTFREE 19-4 1 rtfree 

209-213 rtfree 19-5 rtentry 
22-7 
rt free 
105-115 0 
RNF ACTIVE] RNF ROOT 
RNF ACTIVE RNF ROOT 
rn inithead end! 
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- route.h 
209 #define RTFREE(rt) \ 
210 if ((rt)-»rt refcnt <= 1) N 
211 rtfree(rt); \ 
212 else \ 
213 (rt)-»rt refcnt--; /* no need for function call */ 
route.h 














[] 19-4 [] RIFREE 


106 rtfree(rt) 
107 struct rtentry *rt; 






























































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































108 ( 
109 struct ifaddr *ifa; 
110 if (rt == 0) 
111 panic("rtfree"); 
112 rt-»rt refcnt--; 
113 if (rt-»rt refcnt <= 0 && (rt->rt flags & RTF UP) == 0) ( 
114 if (rt->rt nodes-»rn flags & (RNF ACTIVE | RNF ROOT)) 
115 panic("rtfree 2"); I 
116 rttrash--; 
117 if (rt->rt_refcnt < 0) { 
118 printf("rtfree: %x not freed (neg refs)\n", rt); 
119 return; 
120 ) 
121 ifa = rt->rt_ifa; 
122 IFAFREE(ifa); 
123 Free(rt_key(rt)); 
124 Free(rt); 
125 ) 
126 ) 
route.c 
[] 19-5 rtfre 000000 rtentry DUO 
116 rttrash 
rtrequest 
0 
117-122 IFAFREE ifaddr 
ifafree 
2. 
123-124 rt_setgate 
Free 
rtentry 
(rt. refcnt) 
18-2 0 
rtfree RTF UP 0 
rtrequest 
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TCP/IP 2 
° ( ) 
rtinit RTM_ADD rtquest 
1 rtinit 0 
0 
route 
route_output RTM_ADD rtrequest 
1 route_output 0 
0 
«[] TCP[] UDP IP ip output rtalloc[| rtalloc 
rtallocl 19-3 rtallocl 
(held route) 
route rtentry 
rtfree 0 rtentry 
e RTFREE[] rtfree 8-24 ip_output 
22 
rtallocl 
rtallocl 
rtrequest RTF_UP 
( 0) rtfree rtfree 0 
rtrequest 0 rtfree 
1 rtfree 0 
19.4 rtrequest[] |] 
rtrequest 19-6 


















































































































































































































































































































































































































































[] 19-6 [| [| rtrequest [0 OU 
rtrequest switch case RTM ADD|| RTM DELETE 
RTM RESOLVE 19-7 RTM DELETE 
290-307 dst 
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sa_family flags ( 
) netmask 
route.c 
290 int 
291 rtrequest (req, dst, gateway, netmask, flags, ret_nrt) 
292 int req, flags; 
293 struct sockaddr *dst, *gateway, *netmask; 
294 struct rtentry **ret nrt; 
295 1 
296 int s = splnet(); 
297 int error = 0; 
298 struct rtentry *rt; 
299 struct radix_node *rn; 
300 struct radix_node_head *rnh; 
301 struct ifaddr *ifa; 
302 struct sockaddr *ndst; 
303 #define senderr (x) { error = x ; goto bad; ) 
304 if ((rnh = rt_tables[dst->sa_family]) == 0) 
305 senderr (ESRCH) ; 
306 if (flags & RTF_HOST) 
307 netmask = 0: 
308 switch (req) { 
309 case RTM_DELETE: 
310 if ((rn = rnh->rnh deladdr(dst, netmask, rnh)) == 0) 
311 senderr (ESRCH) ; 
312 if (rn->rn flags & (RNF ACTIVE | RNF ROOT)) 
313 panic("rtrequest delete"); 
314 rt = (struct rtentry *) rn; 
315 rt->rt flags &- "RTF UP; 
316 if (rt-»rt gwroute) { 
317 rt - rt-»rt gwroute; 
318 RTFREE (rt); 
319 (rt = (struct rtentry *) rn)-»rt gwroute = 0; 
320 } 
321 if (fifa = rt->rt_ifa) && ifa->ifa_rtrequest) 
322 ifa->ifa_rtrequest (RTM DELETE, rt, SA(0)); 
323 rttrash++; 
324 if (ret nrt) 
325 *ret nrt = rt; 
326 else if (rt->rt_refent <= 0) { 
327 rt-»rt refcnt++; 
328 rtfree(rt); 
329 } 
330 break; 
route.c 











U 19-7 rtrequest [ [| [| RIM DELETE DD 







































































































































































































































































1. 
309-315 rnh_deladdr (O 18-17 rn_delete) 
rtentry RTF_UP 

2. 
316-320 RTFREE 






























































































































































































































































0 rt gwroute rt 
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TCP/IP 2 
3. 
321=322 ifa rtrequest ARP 
21 ARP 
4. 
323=330 rttrash 
rtentry ( ret nrt ) 
rtfree ret nrt 
0 | rtfree 
break 
19-8 RTM RESOLVE rtallocl 
RTF_CLONING 
rtallocl 
331 case RTM RESOLVE: SE 
332 if (ret_nrt == 0 || (rt = *ret_nrt) == 0) 
333 senderr (EINVAL); 
334 ifa = rt-»rt ifa;- 
335 flags = rt->rt flags € "RTF CLONING; 
336 gateway = rt->rt gateway; 
337 if ((netmask - rt-»rt genmask) -- 0) 
338 flags |= RTF HOST; 
339 goto makeroute; Nuls 
O 19-8 rtrequest [| [| [| RIM RESOLVE T) 
331-339 ret nrt 
RTF CLONING ([] 19-2) rt ifa 
rt gateway (RTF CLONING ) rt genmask 
RTF HOST 
rt genmask 
case makeroute 
19-9 RTM ADD 
5. 
340-342 ifa_ifwithroute (dst) 
ifaddr 
6. 
343-348 rtentry 
radix_node rt_flags 
flags RIF UP 
7. 
349-352 rt gateway (U 19-11) (dst) gateway 
gateway rt key!| rt gateway||rt gwroute 




















































































































8. 
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route.c 
340 case RTM_ADD: 
341 if ((ifa = ifa_ifwithroute (flags, dst, gateway)) == 0) 
342 Li senderr (ENETUNREACH) ; 
343 makeroute: 
344 R Malloc(rt, struct rtentry +, sizeof(*rt)); 
345 if (rt -- 0) 
346 senderr (ENOBUFS) ; 
347 Bzero(rt, sizeof(*rt)); 
348 rt->rt_ílags = RTF_UP | flags; 
349 if (rt_setgate(rt, dst, gateway)) { 
350 Free(rt); 
351 senderr (ENOBUFS) ; 
352 } 
353 ndst = rt_key (rt); 
354 if (netmask) { 
355 rt maskedcopy (dst, ndst, netmask); 
356 ) eise 
357 Bcopy(dst, ndst, dst->sa len); 
358 rn = rnh-»znh addaddr((caddr t) ndst, (caddr t) netmask, 
359 i rnh, rt->rt nodes); 
360 if (rn == 0) £ 
361 if (rt->rt_gwroute) 
362 rtfree(rt->rt gwroute); 
363 Free(rt key(rt)); 
364 Free (rt); 
365 senderr (EEXIST); 
366 } 
367 ifa->ifa_refent++; 
368 rt->rt_ifa = ifa; 
369 rt->rt_ifp = ifa->ifa_ifp; 
370 if (req == RTM_RESOLVE) 
371 rt-»rt rmx = (*ret nrt)-»rt rmx; /* copy metrics */ 
372 if (ifa-»ifa rtrequest) 
373 ifa->ifa_rtrequest (reg, rt, SA(ret nrt ? *ret nrt : 0)); 
374 if (ret nrt) ( 
375 *ret nrt - rt; 
376 rt->rt_refcnt++; 
377 } 
378 break; 
379 } 
380 bad: 
381 splx(s); 
382 return (error); 
383 } 

route.c 

[] 19-9 rtrequest [|] D RIM App OO 
353-357 ( dst) rn_key 
rt maskedcopyl| dst|| netmask dst 
dst|| netmask 
1e0 IP 

( ) 12 13 




















bsdi $ ifconfig le0 inet 140.252.12.63 netmask Oxffffffe0 alias 


490 
































Chinaspubecom 
















































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































TCP/IP 2 
netstat 
Destination Gateway Flags Refs Use Interface 
140.252.12.32 link#1 uC 0 leo 
9. 
358-366 rnh_addaddr (U 18-17 rn_addroute) rtentry 
EEXIST( ) 
10. 
367-369 ifaddr ifaddr|] ifnet 
11. 
370-371 RTM RESOLVE( RTM ADD) HH 
RTM ADD 
12. 
372-373 ifa rtrequest RTM ADD 
RTM RESOLVE ARP 
13. 
374-378 ret_nrt 
0 
rtrequest|| RTM_RESOLVE rt_genmask 
rt_genmask 
18-2 
[Sklower 1991] 19.2 
B 128.1 Oxffffff00 8 
8 254 
128.1 
128.1.0.0 Oxffff0000 128.1 254 
RTTs[] MTUs 
TCP 
RTT[] RTT (U 27-3) route 254 
128.1.0.0 Oxffff0000 
RTF CLONING genmask[] Oxffffff00( ) 
128.1.2.3 128.1.2 
Oxffff0000 128.1 RTF CLONING 
128.1.2 OxffffffÜ0(genmask ) 
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128.1.2.88 
19.5 rt_setgate|| [| 
(rt_key rtentry 
radix_node rn_key ) (rt_gateway) 
rt_setgate 19-10 










































































































































































































radix node() 


(00) 


radix node() 


(00) 












sockaddr in sockaddr in 


radix node() 


(00) 


radix_node{} 

(00) 
sdl_family 
sdl_index 
sdl_type 
sdl_alen 






rt_gateway 
















140.252. 13.33 



































































































































































































































































































































































































































sockaddr_in sockaddr_dl 
U 1910 (1 I] H D D LI | U D LI LI U 
18-2 127.0.0.1[] 140.252.13.33 
Internet 
route 
ARP 
19-11 rt key 
rt setgate 
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TCP/IP 2 
route.c 
384 int 
385 rt setgate(rt0, dst, gate) 
386 struct rtentry *rt0; 
387 struct sockaddr *dst, *gate; 
388 ( 
389 caddr t new, old; 
390 int dien = ROUNDUP (dst->sa len), glen = ROUNDUP (gate-»sa len); 
391 struct rtentry *rt - rt0; 
392 if (rt-»rt gateway -- Il glen > ROUNDUP(rt-»rt, gateway-»sa len)) ( 
393 : old = (caddr_t) rt key(rt); 
394 R_Malloc (new, caddr t, dlen + glen); 
395 if (new -- 0) 
396 return 1; 
397 rt->rt nodes->rn key = new; 
398 ) else ( 
399 new = rt-»rt, nodes->rn key; 
400 old - 0; 
401 } 
402 Bcopy (gate, (rt->rt_gateway = (struct sockaddr +) (new + dlen)), glen); 
403 if (old) { 
404 Bcopy (dst, new, dlen); 
405 Free (old); 
406 } : 
407 if (rt->rt_gwroute) { 
408 rt = rt->rt_gwroute; 
409 RTFREE (rt); 
410 rt = rt0; 
411 rt->rt_gwroute = 0; 
412 } 
413 if (rt->rt flags & RTF GATEWAY) { 
414 rt->rt_gwroute = rtallocl (gate, 1); 
415 } 
416 return 0; 
417 } 
route.c 
O 19-11 rt_setgate J] J 
1. 
384-391 dlen glen ROUNDUP 
4 4 
2: 
392-401 glen rt_gateway 
rn_key 
3. 
398-401 new 
4. 
402 rt_gateway 
5. 
403-406 dst 
6. 
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407-412 rt_gwroute RTFREE 
rt_gwroute 
7. 
413-415 rtallocl 
rt_gwroute rt_setgate 
rt_gwroute 










































































19.6 rtinit[][] 










































































































































































































































































































































































































































































































































































































































































































































































































































































































































































Internet rtinit 
. in control rtinit 
RTM DELETE ( 6-21) 
RTM ADD 
*in ifinit rtinit (O 6-19) 
in ifinit RTF CLONING 
*in ifscrub rtinit 
19-12 rtinit cmd RTM ADD|| RTM DELETE 
- route.c 
441 int 
442 rtinit(ifa, cmd, flags) 
443 struct ifaddr *ifa; 
444 int cmd, flags; 
445 ( 
446 struct rtentry *rt; 
447 struct sockaddr *dst; 
448 struct sockaddr *deldst; 
449 struct mbuf *m - 0; 
450 Struct rtentry *nrt - 0; 
451 int error; 
452 dst = flags & RTF HOST ? ifa->ifa dstaddr : ifa->ifa_addr; 
453 if (cmd == RTM DELETE) ( 
454 if ((flags & RTF HOST) == 0 && ifa-»ifa netmask) L 
455 m = m get (M WAIT, MT SONAME) ; 
456 deldst - mtod(m, struct sockaddr *);. 
457 rt maskedcopy (dst, deldst, ifa->ifa_netmask) ; 
458 dst - deldst; 
459 ) 
460 if (rt = rtallocl(dst, 0)) { 
461 rt-»rt refcnt--; 
462 if (rt-»rt ifa !- ifa) ( 
463 if (m) 
464 (void) m free(m); 
465 return (flags & RTF HOST ? EHOSTUNREACH 
466 : ENETUNREACH) ; 
467 } 
468 } 
469 } i 
470 error = rtrequest (cmd, dst, ifa->ifa addr, ifa->ifa netmask, 
471 flags | ifa->ifa flags, &nrt); 
472 if (m) 
473 (void) m free(m); 
route.c 





H 19-12 rt init H D D] D] H rtremest [I LU n 


494 
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TCP/IP 2 

















































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































1. 
452 
(U ifa_netmask ) 
2. 
453-459 
mbuf 
rt maskedcopy 
mbuf dst mbu 
3. 
460-469 rtallocl 
( rtallocl ) ifaddr 
4. 
470-473 rt_request RTM ADD[|| RTM DELETE rt request 
mbuf 
19-13 rtinit 
- route.c 
474 if (cmd == RTM DELETE && error == 0 && (rt = nrt)) ( 
475 rt newaddrmsg(cmd, ifa, error, nrt); 
476 if (rt->rt_refent <= 0) { 
477 rt->rt_refent++; 
478 rtfree (rt); 
479 } 
480 } 
481 if (cmd == RTM_ADD && error == 0 && (rt = nrt)) { 
482 rt->rt_refent--; 
483 if (rt->rt_ifa != ifa) { 
484 printf ("rtinit: wrong ifa (%x) was (%x)\n", ifa, 
485 rt->rt_ifa); 
486 if (rt-»rt ifa-»ifa rtrequest) 
487 rt-»rt ifa-»ifa, rtrequest (RTM DELETE, rt, SA(0)); 
488 IFAFREE(rt-»rt, ifa); 
489 rt-»rt ifa - ifa; 
490 rt-»rt ifp = ifa-»ifa ifp; 
491 ifa->ifa_refent++; 
492 if (ifa->ifa_rtrequest) 
493 ifa->ifa_rtrequest (RTM ADD, rt, SA(0)); 
494 } 
495 rt_newaddrmsg (cmd, ifa, error, nrt); 
496 } 
497 return (error); 
498 } 


474-480 
(nrt 


TU — == route.c 


O 19-13 reint JI00000 





5. 






































































































































rtreguest 0 rtentry 































































































) 
























































































































































rt_newaddrmsg 0 

























































































rtfree 
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6. 
481-482 rtrequest 0 rtentry 
(nrt) ( rtrequest ) 
7. 
483-494 ifaddr 
rtrequest ifa_ifwithroute ifa (rtrequest 
19-9 ) 
ifa_rtrequest RTM_DELETE ifaddr | | rt ifa 
ifa rtreguest 
RTM ADD 
8. 






















































































495 rt newaddrmsg[| RTM ADD 






























































19.7 rtredirect[|[] 























































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































ICMP icmp input rtredirect[| pfctlinput([] 11-27) 
udp ctlinput[| tcp ctlinput UDP[] TCP| 
(PCB) PCB 
PCB rtfree 
IP rtalloc 
( ) 
rtredirect 
19-14 rtredirect 

147-157 dst IP (U 8-18 HD) 
gateway IP (O 8-18 R2)[] netmask 

flags RTF_GATEWAY RTF_HOST src IP 

(U 8-18 R1)[] rtp icmp input | 
netmask|| rtp 

1. 
158-162 

2. 
163-177 rtallocl 

icmp_input 

rtredirect ICMP 

k RTF DONE 

*rtalloc dst 

N (src) rt gateway 

. ([] ifa ifwithnet ifa ) 

(rt ifa) 
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27D eg rang To 










































































































































































































































































































































































































































































































































































































































































































































































































































































































































































zi gateway 
route.c 
147 int 
148 rtredirect (dst, gateway, netmask, flags, src, rtp) 
149 struct sockaddr *dst, *gateway, *netmask, *src; 
150 int flags; 
151 struct rtentry **rtp; 
152 ( 
153 struct rtentry *rt; 
154 int error = 0; 
155 short *stat = 0; 
156 struct rt addrinfo info; 
157 struct ifaddr *ifa; 
158 /* verify the gateway is directly reachable */ 
159 if ((ifa = ifa ifwithnet(gateway)) == 0) { 
160 error = ENETUNREACH; 
161 goto out; 
162 ) 
163 rt = rtallocl(dst, 0); 
164 /* 
165 * If the redirect isn't from our current router for this dst, 
166 * it's either old or wrong. If it redirects us to ourselves, 
167 * we have a routing loop, perhaps as a result of an interface 
168 * going down recently. 
169 */ 
170 #define equal (al, a2) (bcmp((caddr t) (al), (caddr t)(a2), (al)->sa len) == 0) 
171 if (!(flags & RTF DONE) && rt && ` 
172 (!equal(src, rt->rt_gateway) || rt->rt_ifa != ifa)) 
173 error = EINVAL; 
174 else if (ifa_ifwithaddr (gateway) ) 
175 error = EHOSTUNREACH; 
176 if (error) 
177 goto done; 
178 ZS 
179 * Create a new entry if we just got back a wildcard entry 
180 * or if the lookup failed. This is necessary for hosts 
181 * which use routing redirects generated by smart gateways 
182 * to dynamically build the routing tables. 
183 */ 
184 if ((rt == 0) || (rt_mask(rt) && rt_mask(rt)->sa_len < 2)) 
185 goto create; 
c route.c 
O 19-14 rtrediret 000000000090 
3. 
178-185 
2 
rn zeros([] 18-35) 
19-15 rtredirect 
4. 
186-195 
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flags RTF_HOST Net/3 ICMP 
route.c 
186 /* 
187 * Don't listen to the redirect if it's 
188 * for a route to an interface. 
189 */ 
190 if (rt-»rt flags & RTF GATEWAY) { 
191 if (((rt-»rt flags & RTF HOST) == 0) && (flags & RTF HOST)) { 
192 /* 
193 * Changing from route to net => route to host. 
194 * Create new route, rather than smashing route to net. 
195 */ I 
196 create: i 
197 flags |= RTF GATEWAY | RTF DYNAMIC; 
198 error = rtrequest ((int) RTM ADD, dst, gateway, 
199 netmask, flags, 
200 (struct rtentry ++) 0); 
201 stat = &rtstat.rts dynamic; 
202 } else { 
203 /* 
204 * Smash the current notion of the gateway to 
205 * this destination. Should check about netmask!!! 
206 */ 
207 rt->rt_ílags |= RTF_MODIFIED; 
208 flags |= RTF_MODIFIED; 
209 stat = &rtstat.rts_newgateway; 
210 rt_setgate(rt, rt_key(rt), gateway); 
211 } i 
212 ) else 
213 error = EHOSTUNREACH; 
214 done: 
215 if (rt) { 
216 if (rtp && !error) 
217 *rtp = rt; 
218 else : 
219 rtfree (rt); 
220 } 
221 out: 
222 if (error) 
223 rtstat.rts_badredirect++; 
224 else if (stat != NULL) 
225 (*stat) ++; 
226 bzero((caddr t) & info, sizeof(info)); 
227 info.rti_info[RTAX_DST] = dst; 
228 info.rti_info[RTAX_GATEWAY] = gateway; 
229 info.rti_info[RTAX_NETMASK] = netmask; 
230 info.rti_info[RTAX_AUTHOR] = src; 
231 rt_missmsg (RTM_REDIRECT, &info, flags, error); 
232 } 
route.c 
[] 19-15 rerequest 0000000 
5. 
196-201 rtrequest RTF GATEWAY||] RTF DYNAMIC 
netmask 1 
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TCP/IP 2 
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rt_setgate 
































gateway 















































212-213 

























































































( RTF GATEWAY ) 











































































































EHOSTUNREACH 





































































































214-225 






































































































































( rtp ) 






































rtfree 




































































9. 


























226-232 


_addrinfo 











































































































rt_missmsg 
































raw_input 














































































































198 DODODODO 








































































































































































































































































































































































































































































































































































































































































































































































































































































































8 

*rt msghdr 
if msghdr 
ifa msghdr 

18-11 18-9 

8 rtm addrs[| ifm addrs[| ifam_addrs 
19-16 rt_msghdr[] RTM IFINFO 19-17 
if msghdr RTM NEWADDR[| RTM DELADDR 19-18 ifa msghdr 
































139 struct rt msghdr { 


140 u short rtm msglen; /* 
141 u char rtm version; £" 
142 u char rtm_type; £* 
143 u_short rtm_index; /* 
144 int rtm flags; /* 
145 int rtm addrs; /*. 
146 pid t rtm pid; /* 
147 int rtm seq; ZS 
148 int rtm errno; £* 
149 int rtm use; Lë 
150 u_long rtm_inits; /* 
151 struct rt metrics rtm rmx;  /* 
152 ); 





















































































































































route.h 


to skip over non-understood messages */ 
future binary compatibility */ 
message type */ 


index for associated ifp */ 

flags, incl. kern & message, e.g. DONE */ 
bitmask identifying sockaddrs in msg */ 
identify sender */ 

for sender to identify action */ 

why failed */ 

from rtentry */ 

which metrics we are initializing */ 
metrics themselves */ 


route.h 


[] 19-16 rt msghdr [] [] 
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: ifh 
235 struct if msghdr { 
236 u short ifm msglen; /* to skip over non-understood messages */ 
237 u char ifm version; /* future binary compatability */ 
238 u char ifm type; /* message type */ 
239 int ifm addrs; /* like rtm addrs */ 
240 int ifm flags; /* value of if flags */ 
241 u short ifm index; /* index for associated ifp */ 
242 struct if data ifm data; /* statistics and other data about if */ 
243 }; 

ifh 
[] 19-17 if msghdr [] [] 

- ifh 
248 struct ifa msghdr ( 
249 u.short ifam msglen; /* to skip over non-understood messages */ 
250 u char ifam version; /* future binary compatability */ 
251 u char ifam type; /* message type */ 
252 int ifam addrs; /* like rtm addrs */ 
253 int ifam flags; /* value of ifa flags */ 
254 u short ifam index; /* index for associated ifp */ 
255 int ifam metric; /* value of ifa metric */ 
256 }; ifh 


O 19-18 ifa msghdr 00 
















































































































































































rtm addrs|| ifm addrs[]ifam addrs 





























































































































































































































































































































19-19 

RTA DST Ox01 RTAX DST 0 dst 0020000000 
RTA GATEWAY 0x02 RTAX_GATEWAY 1 gate 0000000 
RTA_NETMASK 0x04 RTAX_NETMASK 2 netmask 00000000 
RTA_GENMASK 0x08 RTAX_GENMASK 3 genmask 0000000000 
RTA IFP 0x10 RTAX_IFP 4 ifpaddr 00000000 
RTA IFA 0x20 RTAX_IFA 5 ifaaddr 00000000 
RTA_AUTHOR Ox40 RTAX AUTHOR 6 U U 0 0 D 0 00 D 0 
RTA BRD 0x80 RTAX_BRD 7 brdaddr 000000000090 

RTAX_MAX 8 rti-into[] 0000000 

019-19 [J DB TJ xci info [000000 
1 Ox20(RTA_IFA)] I 
(RTAX_IFA) 



































































































































































































































































































































0x87 






































































































































19-19 rt_addrinfo 19-20 
























































































































































































































































































































































































































































500 amu a: China=pubecom 
— TT 























































































































































































































































































































































































































































































































































































































































































































7 route.h 
199 struct rt_addrinfo { 
200 int rti_addrs; /* bitmask, same as rtm_addrs */ 
201 struct sockaddr *rti, info[RTAX MAX]; i 
202 }; 
route.h 
0 19-20 rt_addrinfo D 11T HB BPD BB DH D: 0 DH DU D 1 0 DID D 
rti addrs RTA_GATEWAY rti_info 
[RTA GATEWAY[] Internet 
IP sockaddr in 
19-19 rtsock.c[] rti info 
#define dst info.rti info[RTAX DST] 
RTAX AUTHOR 
rt addrinfo rtallocl([] 19-2)]] rtredirect 
(U 19-14) 19-21 rtallocl rt missmsg 

























































































































































































rt addrinfo() 


rti. info[RTAX NETMASK] 
NULL 


O 19-21 rtalloci [][][] rt missmsg [| rt addrinfo [| [| 







0 sockaddr in() 


D D OC IPL 0 


















0 
































































































































































































































rti addrs rti info 


















































































































































































































































































































































19-22 rtredirect rt missmsg 





























rt addrinfo() 


Eti info[RTAX NETMASK] | NULL 

































rti_info[RTAX_IFA] 
rti_info[RTAX_AUTHOR] - 
rti_info[RTAX_BRD] 


[ 19-22 rtredirect [|] [| [| rt missmsg [| rt addrinfo U J 














O000000 OO IPOD 
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19-23 route cb 
IP[] XNS[] OSI E u 
203-208 
raw_input 
route.h 

203 struct route cb { 

204 int ip count; /* IP */ 

205 int ns count; /* XNS */ 

206 int iso count; /* ISO */ 

207 int any count; /* sum of above three counters */ 


208 }; 
MT en route. H 


0 19-23 route co UD UU 000000 000 0 


19.9 rt_missmsg|| || 






























































19-24 rt_missmsg 19-21 19-22 rt_msgl 


mbuf| raw input mbuf| 

























































































































































































































































































516 void . 

517 rt missmsg(type, rtinfo, flags, error) 

518 int type, flags, error; 

519 struct rt addrinfo *rtinfo; 

520 ( 

521 struct rt msghdr *rtm; 

522 struct mbuf *m; 

523 struct sockaddr *sa - rtinfo-»rti info[RTAX DST]; 
524 if (route cb.any count == 0) 

525 return; 

526 m - rt msgl(type, rtinfo); 

527 if (m == 0) 

528 return; 

529 rtm - mtod(m, struct rt, msghdr *); 

530 rtm-»rtm flags - RTF DONE | flags; 

531 rtm-»rtm errno - error; 

532 rtm-»rtm addrs = rtinfo-»rti addrs; 

533 route, proto.sp protocol - sa ? sa->sa family : 0; 
534 raw input(m, &route proto, &route src, &route dst); 
535 } 





[| 19-24 rt missmsg UU 



















































































































































































































































































































































































516-525 
1. [] mbu 
526-528 rt msgl(19.12[] )[] mbu 19- 
22 rt addrinfo 19-25 mbu 
mbu raw input sbappendaddr mbuf 













































































































































































502 remo n: China+pub.tom 
—— DÉI 












































mbuf {} 000000 mbut mbuf () 
m_next m_next NULL 
m_nextpkt NULL m_nextpkt NULL 
m len 100 m len 24 
m data m data 
m type MT DATA m type MT. DATA 
m flags M PKTHDR m flags 0 
m pkthdr.len [124 Sockaddr in() 
m pkthdr.rcvif NULL (0000800) 


sockaddr_in() 
a6] D) 




































































rt msghdr() 
(760 0) 






















































































































































































































































































































































































































































































































































































































































































































































































Sockaddr in() 
aQ 0) 


































































































































































































































































































































































































sockaddr_in{} 
(«D 0 sd n» 
























































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































[]19-25 [] rt msg HH 00000 19-220 mbuf[] 












































































































































































































































































































































































































































2. 

529—532 rtm flags|| rtm errno rtm addrs 
rti addrs 19-21 19-22 rti addrs 0 
rt msgl rti info 
3. raw input 







































































533-534 raw input 



































































































































































































































































































































































































































struct sockaddr route dst - 2, PF ROUTE, Z 
struct sockaddr route src = 2, PF ROUTE, £ 
struct sockproto route proto = { PF ROUTE |; 
sockproto 19-26 
socket.h 
128 struct sockproto { 
129 u_short sp_family; /* address family */ 
130 u_short sp_protocol; /* protocol */ 
131 ); 
socket.h 


O 19-26 sockproto [] [] 














































































































LH 














PF ROUTI 
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raw_input socket 










































































raw_input route_proto sp_protocol 





































































































































































































rt_missmsg 
sa_family( ) 19-21 19-22 AF_INET 





















































































































































19.10 rt_ifmsg|| |] 






































4-30 if up[| if dowm 19-27 rt ifmsg 


















































































































































































































































i rtsock.c 
540 void 


541 rt ifmsg(ifp) 
542 struct ifnet tifp; 

































































































































































































































































































































































































































































































































































































































































































































































543 ( 
544 struct if msghdr *ifm; 
545 struct mbuf *m; 
546 struct rt_addrinfo info; 
547 if (route_cb.any_count == 0) 
548 return; 
549 bzero((caddr t) & info, sizeof(info)); 
550 m = rt msgl (RTM IFINFO, &info); 
551 if (m == 0) 
552 return; 
553 ifm = mtod(m, struct if msghdr *); 
554 ifm->ifm index = ifp->if index; 
555 ifm->ifm flags = ifp-»if flags; . 
556 ifm->ifm data = ifp->if data; /* structure assignment */ 
557 ifm->ifm_addrs = 0; 
558 route_proto.sp_protocol = 0; f 
559 raw_input (m, &route_proto, &route_src, &route dst); 
560 ) I 
rtsock.c 
O 19-27 rt_ifmsg J U 
547-548 
1. [| mbu 
549-552 rt_addrinfo OU rt_msgl mbuf] 
rt addrinfo if msghdr 
2. 
553-557 if_data mbu ifm_addrs 
0 
3. raw input 
558-559 0 
raw_input 



















































































































































































504 





TCP/IP 









































Chinaspubscom 











































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































19.11 rt_newaddrmsg[] || 
19-13 rtinit RTM_ADD 
RTM_DELETE rt_newaddrmsg 19-28 rt_newaddrmsg 
rtsock.c 
569 void 
570 rt_newaddrmsg (cmd, ifa, error, rt) 
571 int cmd, error; 
572 struct ifaddr *ifa; 
573 struct rtentry *rt; 
574 ( 
575 struct rt addrinfo info; 
576 struct sockaddr *sa; 
577 int pass; 
578 struct mbuf *m; : 
579 struct ifnet *ifp = ifa->ifa_ifp; 
580 if (route_cb.any_count == 0) 
581 return; 
582 for (pass = 1; pass < 3; pass++) { 
583 bzero((caddr t) & info, sizeof(info)); 
584 if ((cmd == RTM ADD && pass == 1) || 
585 (cmd == RTM DELETE && pass == 2)) { 
586 struct ifa msghdr *ifam; 
587 int ncmd - cmd -- RTM ADD ? RTM NEWADDR : RTM DELADDR; 
588 ifaaddr - sa - ifa-»ifa addr; 
589 ifpaddr = ifp->if addrlist-»ifa addr; 
590 netmask = ifa->ifa netmask; 
591 brdaddr = ifa-»ifa dstaddr; 
592 if ((m = rt msgl(ncmd, &info)) == NULL) 
593 continue; 
594 ifam = mtod(m, struct ifa msghdr *); 
595 ifam->ifam_index = ifp->if_index; 
596 ifam->ifam_metric = ifa->ifa_metric; 
597 ifam->ifam_flags = ifa->ifa_flags; 
598 ifam->ifam_addrs = info.rti_addrs; 
599 } 
rtsock.c 
O 19-28 rt newaddamsg 2000000000 ifa msghdr 
580-581 
1. 
582 
for RTM_ADD 
RTM NEWADDR RTM ADD RTM DELETE 
RTM DELETE RTM DELADDR|| RTM NEWADDR 
RTM DELADDR ifa msghdr RTM ADD|| RTM DELETE 
rt msghdr 
583 rt addrinfo 0 
2. 
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588-591 

rti_info ifaaddr|| ifpaddr|| netmask[| brdaddr 
info[] rti info | 19-19 rt msgl[] mbu 

sa ifa addr | 

ifa msghdr 
































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































rt_msgl 
19-29 rt_newaddrmsg rt_msghdr 
| | 
3. 
600-609 rt mask||rt key[|rt gateway rti info 
sa rt msgl[] mbu 
rt msghdr rt msgl 
4. raw input 
616-619 raw input 
rtsock.c 
600 if ((cmd == RTM ADD && pass == 2) || 
601 (cmd == RTM_DELETE && pass == 1)) { 
602 struct rt msghdr *rtm; 
603 if (rt == 0) 
604 continue; 
605 netmask = rt_mask(rt); 
606 dst = sa = rt_key (rt); 
607 gate = rt->rt gateway; 
608 if ((m = rt msgl(cmd, &info)) == NULL) 
609 continue; 
610 rtm = mtod(m, struct rt msghdr *); 
611 rtm->rtm_index = ifp->if_index; 
612 rtm->rtm_flags |= rt->rt_flags; 
613 rtm->rtm_errno = error; 
614 rtm->rtm_addrs = info.rti_addrs; 
615 } ; 
616 route proto.sp protocol - sa ? sa-»sa family : 0; 
617 raw input(m, &route proto, &route src, &route, dst); 
618 } 
619 } 
rtsock.c 





U 19-29 rt newaddmsg 0000000000 rtmsghdr UD 


19.12 rt_msgl|] |] 
























































rt_msgl 19-25 
mbuf] rt msgl 19-22 rt msghdr[| rt addrinfo 
19-30 













































































































































































































































































506 


TCP/IP 
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e rtsock.c 
399 static struct mbuf * 
400 rt msgl (type, rtinfo) 
401 int type; 
402 struct rt_addrinfo *rtinfo; 
403 { 
404 struct rt msghdr *rtm; 
405 struct mbuf *m; 
406 int i; 
407 struct sockaddr *sa; 
408 int len, dlen; 
409 m = m gethdr(M DONTWAIT, MT DATA); 
410 if (m -- 0) 
411 return (m); 
412 Switch (type) ( 
413 case RTM DELADDR: 
414 case RTM NEWADDR: 
415 len - sizeof(struct ifa msghdr); 
416 break; 
417 case RTM IFINFO: 
418 len = sizeof(struct if msghdr); 
419 break; 
420 default: 
421 len = sizeof (struct rt msghdr); 
422 } 
423 if (len > MHLEN) 
424 panic("rt, msgl"); 
425 m->m pkthdr.len = m-»m len = len; 
426 m-»m pkthdr.rcvif - 0; 
427 rtm - mtod(m, struct rt msghdr *); 
428 bzero((caddr t) rtm, len); 
429 for (i = 0; i « RTAX MAX; i++) { 
430 if ((sa = rtinfo-»rti info[i]) == NULL) 
431 continue; 
432 rtinfo-»rti addrs |- (1 «« i); 
433 dlen = ROUNDUP (sa->sa len); 
434 m copyback(m, len, dlen, (caddr t) sa); 
435 len += dlen; 
436 } 
437 if (m-»m pkthdr.len != len) { 
438 m freem(m); 
439 return (NULL); 
440 } 
441 rtm->rtm_msglen = len; 
442 rtm->rtm_version = RTM_VERSION; 
443 rtm->rtm_type = type; 
444 return (m); 
445 } x 
=— rtsock.c 
U 19-30 rt msgi [] 0 D D D Ú Ú D 0 mbuf 
1. mbu 
399-422 mbu len 18-9 
ifa_msghdr if msghdr 
rt msghdr 
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2. mbuf 
423-424 mbuf| mbuf| 
mtod if msghdr 
84 MHLEN(100) 
3. mbu 
425-428 mbuf 0 
4. mbufl 
429-436 rt_addrinfo rti_info 
m_copyback mbuf 1 RTX. xxx| 
RTA_xxx (U 19-19) 
rti_addrs ROUNDUP 
4 
437-440 mbuf len m_copyback 
mbuf 
de 
441-445 
xxx msghdr rtm 
rt msghdr 
19.13 rt msg2[|[] 
rt msgl|| mbuf raw input 
mbuf rt msgl rt msg2 
mbu rt msg2 walkarg 
sysctl rt_msg2 
rt msg2 
1) route output RTM GET 
2) sysctl dumpentryl] sysctl iflist sysctl 
rt_msg2 19-31 2 walkarg 
41 struct walkarg { risock.c 
42 int w op; /* NET RT xxx */ 
43 int w arg; /* RTF xxx for FLAGS, if index for IFLIST */ 
44 int w given; /* size of process' buffer */ 
45 int w needed; /* #bytes actually needed (at end) */ 
46 int w tmemsize; /* size of buffer pointed to by w tmem */ 
47 caddr t w where; /* ptr to process’ buffer (maybe null) */ 
48 caddr_t w_tmen; /* ptr to our malloc’ed buffer */ 
— rtsock.c 





U 19-31 walkarg 000000 sysctl 0000000 




















































































































19-32 rt msg2 rt msgl 
































5 08 TCP/IP 2 












































Chinas pup. coN 


rtsock.c 


























































































































































































































































































































































































































































































































































































































































































































































































































446 static int 

447 rt_msg2 (type, rtinfo, cp, w) 

448 int type; 

449 struct rt_addrinfo *rtinfo; 

450 caddr_t cp; 

451 struct walkarg *w; 

452 { 

453 int i; 

454 int len, dlen, second time = 0; 

455 caddr t cp0; 

456 rtinfo->rti addrs = 0; 

457 again: 

458 Switch (type) { 

459 case RTM DELADDR: 

460 case RTM NEWADDR: 

461 len = sizeof(struct ifa msghdr); 

462 break; 

463 case RTM IFINFO: 

464 len - sizeof(struct if msghdr); 

465 break; 

466 default: 

467 len = sizeof(struct rt msghár); 

468 } 

469 if (cp0 = cp) 

470 cp += len; 

471 for (i = 0; i < RTAX MAX; i++) { 

472 struct sockaddr *sa; 

473 if ((sa = rtinfo-»rti infoli]) == 0) 

474 continue; 

475 rtinfo->rti_addrs |= (1 << i); 

476 dlen = ROUNDUP (sa->sa len); 

477 if (cp) { 

478 beopy ((caddr_t) sa, cp, (unsigned) dlen); 

479 cp += dlen; 

480 } 

481 len += dlen; 

482 } 

— UM q — sx T === — — — rtsock.c 

0 19-32 rt msg2 JI000000000 
446-455 cp 
cp rt_msg2 
route_output 
route_output sysctl 
1. 

458-470 cp 















































































































































































































































cp 
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471-482 for rti_info rti_addrs 
cpl (U O cp ) 

19-33 rt_msg2 walkarg 
483 if (cp == 0 && w != NULL && !second_time) { SE 
484 struct walkarg *rw = w; 

485 rw->w_needed += len; 

486 if (rw->w needed <= 0 && rw->w where) ( 
487 if (rw->w tmemsize < len) { 

488 if (rw-»w tmem) 

489 ` free (rw->w_tmem, M_RTABLE); 
490 if (rw->w_tmem = (caddr_t) 

491 mal loc (len, M RTABLE, M, NOWAIT)) 
492 rw->w_tmemsize = len; 

493 } 

494 if (rw-»w tmem) { 

495 Cp - rw-»w tmem; 

496 second time - 1; 

497 goto again; 

498 } else 

499 rw->w where = 0; 

500 } 

501 } 

502 if (cp) { 

503 struct rt msghdr *rtm = (struct rt msghdr *) CDU : 
504 rtm->rtm_version = RTM VERSION; 

505 rtm->rtm_type = type; 

506 rtm->rtm_msglen = len; 

507 } 

508 return (len); 

509 } 


— 7 —— y — - 9<ssxYí -FTrtsock.c 







































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































U 19-33 rt meaz 000000000 walkarg 
483-484 walkarg if 
second time 0 if 1 
19-32 again cp w 
cp 
3. 
485-486 w_needed 0 sysctl 
500 w needed -500 
w_where 
w_where systcl 
w_where rt_msg2 
rt_msg2 again 
19-34 
4. 
487-493 w_tmemsizel] w_tmem sysctl_rtable 0 
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TCP/IP 2 
sysctl rt_msg2 
000 cp w w.w_where | second_time O 
route_output 000000 
000000 
O U D O 0 00000000 
sysctl rtable U DO DO 0 uggaaggagagad 
U U U U U U 0000000000 
U 19-34 rt msg2 [00000000 
5. 
494-499 w_tmemsize cp 
second_time 1 again second_time 1 
df w tmem 
alloc 
6. 
502-509 cp 











19.14 sysctl_rtable|] |] 





















































































































































































































































































































































sysctl 18-11 net_sysctl 
19-35 
arp 
int mib[6]; 
size t needed; 
char *buf, *lim, *next; 
struct rt msghdr  *rtm; 
mib[0] - CTL NET; 
mib[1] = PF, ROUTE; 
mib[2] = 0; 
mib[3] = AF INET; /* address family; can be 0 */ 
mib[4] = NET RT FLAGS; /* operation */ 
mib[5] = RTF LLINFO; /* flags; can be 0 */ 
if (sysctl(mib, 6, NULL, &needed, NULL, 0) « 0) 
quit("sysctl error, estimate"); 
if ( (buf = malloc(needed)) == NULL) 
quit ("malloc"); 
if (sysctl(mib, 6, buf, &needed, NULL, 0) « 0) 


quit("sysctl error, retrieval"); 


lim - buf 4 needed; 
for (next - buf; next « lim; next «- rtm-»rtm msglen) ( 
- (struct rt msghdr *)next; 

/* do whatever */ 


rtm 


[] 19-35 
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mib sysctl_rtable 

mib[4] 3 

1) NET_RT_DUMP mib[3] 0 

RTM_GET 
rt_key|| rt gatewayl| rt_netmask 

rt genmask 

2) NET RT FLAGS mib [5] RTF xxx| ( 18-25) 

3) NET RT IFLIST mib [5] 

if index ifnet 

RTM IFINFO 
RTM NEWADDR if addrlist ifaddr 
mib [3] 0 RTM NEWADDR| mib[3] 
mib[3][] 0 
SIOCGIFCONF ioct[]4-26) 
sysctl 
19- 
35 sysctl malloc sysctl 
sysctl ( 
) lim 
rtm msglen 
19-36 Net /3 mib 


























































































































































































































CTL_NET 
PF_ROUTE 
0 
AF_INET 


RTF_LLINFO 







































































































































































































































































































































































































































































































































































Internet mib[3] AF_INET gated | 
mib[3] 0 
19-37 sysctl_xxx 
19-38 sysctl_rtable 
























































705-719 sysctl new 
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TCP/IP 2 
720-721 namelen 3 name 
name [0] ( mib[3])[] name [1] (mib[4]) 
(mib[5]) 
sysctl 
au 


















00000 


U U 
UU 
00 


E? SE 
Ej ves 
oO oOo 
E E E 


0 19-37 OOO 


























O00000 


name [2] 


mei m A A A ok 


705 int 


706 sysctl_rtable (name, namelen, where, given, new, newlen) 


707 int 
708 int 


*name; 
namelen; 


709 caddr_t where; 
710 size_t *given; 
711 caddr_t *new; 

712 size t newlen; 


713 ( 
714 
715 
716 
717 


718 
719 


720 
721 
722 
723 


struct radix_node_head *rnh; 
int i, s, error = EINVAL; 
u_char af; 

struct walkarg w; 


if (new) 
return (EPERM); 
if (namelen != 3) 
return (EINVAL); 
af = name[0]; 
Bzero(&w, sizeof(w)): 


H 19-38 sysctl rtable [0000 sysctl 000000 
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724 w.w_where = where; 

725 w.w_given = *given; 

726 w.w_needed = 0 - w.w_given; 

727 w.w_op = name[1]; 

728 w.w arg = name [2] ; 

729 S = splnet(); 

730 switch (w.w op) ( 

731 case NET RT DUMP: 

732 case NET RT FLAGS: 

733 for (i = 1; i <= AF MAX; i++) 

734 if ((rnh = rt tables[i]) && (af == || af == i) && 

735 (error = rnh-»rnh walktree (rnh, 

736 Sysctl dumpentry, &w))) 

737 break; 

738 break; 

739 case NET RT IFLIST: 

740 error = sysctl_iflist (af, &w); 

741 } 

742 splx(s); 

743 if (w.w_tmem) 

744 free (w.w_tmem, M RTABLE); 

745 w.w_needed += w.w_given; 

746 if (where) { 

747 *given = w.w_where - where; 

748 if (*given < w.w_needed) 

749 return (ENOMEM) ; 

750 } else { 

751 *given = (11 * w.w_needed) / 10; 

752 } 

753 return (error); 

754 3 

rtsock.c 
U 19-38 (0) 
2. walkarg 
723-728 walkarg ([] 19-31) 0 w where 
w given ([] w where 
) 
w needed w op ( NET RT xxx)[] w_arg 
3. 
731-738 NET RT DUMP|| NET RT FLAGS 
(rt table ) 0 
rnh walktree 18- 
17 rnh walktree rn walktree 
(sysctl dumpentry) 
rn walktree 

sysctl dumpentry walkarg 





















































sysctl 





514 





TCP/IP 2 














































































































China-pub.com 





























ifnet 


















































































































































































































































4. 
739-740 NET RT IFLIST sysctl_iflist 
5. 
743- 744 rt_msg2 
6. w_needed 
745 rt msg2 w needed 
w given 



























































w needed = 0 - 



































w given + totalbytes 











































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































totalbytes rt msg2 w needed 
w given 
w needed = 0 - w given + totalbytes + w given 
- totalbytes 
w given w where 
w given 19-35 needed 
7. 0 
746-749 [| where given 0 
8. 
750-752 where 
sysctl 10%[] 10% 
19.15 sysctl_dumpentry|] |] 
sysctl_rtable rn_walktree 
19-39 
623-630 radix_node 
rtentry sysctl_rtable | walkarg 
1. 
631-632 (mib[5]) rt flags 
19-36 arp RTF LLINFO 
ARP 
2. 
633-638 rti info U U U dst[] gate 
netmask|| genmask rt_msg2 
RTM_GET 
3. 
639-651 rt_msg2 
w_tmem copyout 
w_where 
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7 rtsock.c 
623 int 
624 sysctl_dumpentry (rn, w) 
625 struct radix_node *rn; 
626 struct walkarg *w; 
627 I 
628 struct rtentry *rt = (struct rtentry *) rn; 
629 int error = 0, size; 
630 struct rt addrinfo info; 
631 if (w->w_op == NET RT FLAGS && !(rt-»rt flags & w->w_arg)) 
632 return 0; 
633 bzero((caddr t) & info, sizeof(info)); 
634 dst = rt key (rt); 
635 gate - rt-»rt, gateway; 
636 netmask = rt_mask (rt); 
637 genmask = rt->rt_genmask; 
638 size = rt_msg2 (RTM_GET, &info, 0, w); 
639 if (w->w_where && w->w_tmem) { 
640 struct rt msghdr *rtm = (struct rt msghdr *) w->w_tmen; 
641 rtm->rtm_flags = rt->rt_flags; 
642 rtm->rtm_ use = rt->rt_use; 
643 rtm->rtm_rmx = rt->rt rmx; 
644 rtm->rtm index = rt->rt ifp->if index; 
645 rtm->rtm_errno = rtm->rtm_pid = rtm->rtm seq = 0; 
646 rtm->rtm_addrs = info.rti_addrs; 
647 if (error = copyout((caddr t) rtm, w->w where, size)) 
648 w->w where = NULL; 
649 else : 
650 w-»w where += size; 
651 H 
652 return (error); 
653 } 
rtsock.c 
U 19-39 sysctl dumentry  []l]U U U B LU LI U D 0 
19.16 sysctl iflist[|[] 
19-40 sysctl rtable 
for ifnet 
while ifaddr 
RTM_IFINFO RTM_NEWADDR 
1. 
654-666 (U 19-36 mib[5]) 
if_index 
2. 
667-670 RTM_IFINFO ifpaddr 
RTM_IFINFO rt msg2 info ifpaddr 0 
info RTM NEWADDRI||| 
3. 
671-681 if_msghdr copyout 

































































































































































516. + 
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w_where 














654 int 


rtsock.c 


655 sysctl_iflist (af, w) 


656 int 


af; 


657 struct walkarg *w; 


658 { 
659 
660 
661 
662 


663 
664 
665 
666 
667 
668 
669 
670 
671 
672 


673 
674 
675 
676 
677 
678 
673 
680 
681 
682 
683 
684 
685 
686 
687 
688 
689 
690 


691 
692 
693 
694 
695 
696 
697 
698 
699 
700 
701 
702 
703 
704 } 


struct ifnet *ifp; 
struct ifaddr *ifa; 
struct rt_addrinfo info; 
int len, error = 0; 


bzero((caddr_t) & info, sizeof (info)); 


for (ifp = ifnet; ifp; ifp = ifp->if next) I 
if (w->w_arg && w->w_arg != ifp->if index) 
continue; 


ifa = ifp->if_addrlist; 


ifpaddr 


= ifa->ifa_addr; 


len = rt_msg2(RTM_IFINFO, &info, (caddr_t) 0, w); 


ifpaddr 


= 0; 


if (w->w_where && w->w_tmem) { 
struct if_msghdr *ifm; 


ifm = (struct if_msghdr *) w->w_tmem; 
ifm->ifm_index = ifp->if_index; 
ifm->ifm_flags = ifp->if_flags; 
ifm->ifm_data = ifp->if_data; 
ifm->ifm addrs = info.rti addrs; 


if 


(error = copyout ((caddr_t) ifm, w->w where, len)) 
return (error); 


w->w_where += len; 


} 


while (ifa = ifa->ifa_next) { 


if 


(af && af != ifa->ifa_addr->sa_family) 
continue; 


ifaaddr = ifa->ifa_addr; 

netmask = ifa->ifa_netmask; 

brdaddr = ifa->ifa_dstaddr; 

len = rt_msg2 (RTM_NEWADDR, &info, 0, w); = 


if 


} 
) 


(w->w where && w->w_tmem) ( 
struct ifa msghdr *ifam; 


ifam = (struct ifa msghdr +) w->w_tmem; 

ifam->ifam index = ifa->ifa ifp->if index; 

ifam->ifam flags = ifa->ifa flags; 

ifam->ifam metric = ifa->ifa metric; 

ifam->ifam addrs = info.rti addrs; 

if (error = copyout (w->w tmem, w->w_where, len)) 
return (error); 

w-»w where += len; 


ifaaddr = netmask = brdaddr = 0; 


) 
return (0): 


— ———-————_—II—— n —[ MqLAaAaÇKN — < — — — —— rtsock.c 


U 19-40 sysctliflist UD 00000 0 0 0 0 0 0 





4. 

















































































































682-684 











































































































ifaddr (O 19-36 








































































































19 517 


















































mib[3]) 
J: 
685-688 rt_msg2 




















































































































RTM_NEWADDR 









































































































































ifaddr|| netmask|] brdaddr 







































































































































































































































































































































































































































































6. 
689-699 ifa_msghdr copyout 
w_where 
701 info[] U 0 
19.17 00 


























































































































































































































































































































(O routed[] gated) 



































































































































sysctl 


















































































































































































































































































































































































































































U U 





19.1 RTF DYNAMIC[] RTF MODIFIED 






































































































































19.2 













































































bsdi $ route add default -cloning -genmask 255.255.255.255 sun 




















19.3 15[] ARP 20 













































































sysctl 































































































paw 0000 





























































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































20.1 ID 
O (routing domain) [] 0 U U 0 LU 
socket O PF ROUTE SOCK RAWI|] DI 
| 
1) RTM ADD 
2) RTM DELETE E 
3) RTM GET 
4) RTM CHANGE (UI) 
5) RTM LOCK | 
| i 0 
LU U U U U LU LU LU 
(route output) (raw input) 
| | 
20.2 routedomain[| protosw|] |] 
UU | | IO! | UI | | 
SOCK RAW[] | | | | 
20-1 O O routedomai PF ROUTE[][] domain 
[] [] [] U [] 
dom family PF ROUTE gut 
dom name route O O 
dom_init route_init NO OD DO O0 18-30 
dom_externalize 0 0020000000 
dom dispose 0 0000000 
dom_protosw routesw OOOOOOGO 20-2 
dom_protoswNPROTOSW 000000000000 
dom nezt [| domaininit 9 O O 7-15 
dom_rtattch DU DDD DDD 
dom rtoffset 000000 0 
dom_maxrtkey U D D D D D 0 
O 20-1 routedomain 00 
(TCP UDP[] ICMP[] )[] Internet Ut 
SOCK RAW | 0 20-2 | PF ROUTE 
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O 0 routesw[0] U U 
pr_type SOCK_RAW "DUDU 
pr domain &routedomain 00000 
pr protocol 0 
pr_flags PR_ATOMI| PR_ADDR DOOOOOOOOOOOODO 
pr input raw input 000000 raw input 000 
pr output route output PRU SEND OOOO 
pr ctlinput raw ctlinput U D D D D 
pr ctloutput 0 U 0 D 
pr usrreq route usrreq U D D D DDD DDD D 0 
pr_init raw_init [1 D D 
pr fasttimo 0 OOO 
pr_slowtimo 0 OOO 
pr_drain 0 O D D 
pr_sysctl sysctl_rtable OO sysct1(830 0 0 O 
































0 202 0000 protosw [ D D 


20.3 00000 


































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































socket (PF_ROUTE, SOCK_RAW, protocol); 
(route usrreq)[] PRU ATTACH 
protocol 
protocol AF INET Internet 
protocol 0 
(raw control block) 
32 IP 
20-3 rawcb[] [] 
raw cb.h 
39 struct rawcb { å us 
40 Struct rawcb *rcb next; /* doubly linked list */ 
41 struct ràwcb *rcb prev; 
42 struct socket *rcb socket; /* back pointer to socket */ 
43 Struct sockaddr *rcb faddr; /* destination address */ 
44 struct sockaddr *rcb laddr; /* socket's address */ 
45 struct sockproto rcb proto; /* protocol family, protocol */ 
46 ); 
47 #define sotorawcb(so) ((struct rawcb *)(so)-»so pcb) 
raw cb.h 
[] 20-3 rawcb [] [| 
| rawcb 20-4 
39-47 19-26 sockproto sp. family 
PF ROUTE sp protocol] U socket|] | 0 
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TCP/IP 2 
rcb_faddr route_src 19-26 
route_src|| rcb_laddr 
000 ooo 
file() filet) 
DTYPE SOCKET f type 
f data 
socket () 
sock RAN so type 
so. pcb 
Ba ee EA DUDU. 
rawcb{} raweb{} 000 
rcb prev 
00000000 
4---- - - - - -- - --- EE > 
O0000000 
020-4 Odo Dodo o 00000000 
20.4 raw init[|[] 
20-5 raw init 20-2 protosw 
18-29 
38-42 
- raw usrreq.c 
38 void 
39 raw init() 
40 I 
41 rawcb.rcb next = rawcb.rcb_prev = &rawcb; 
423 
raw_usrreg.c 


Q 20-5 raw iit [000000000000000 


20.5 route output) [] 





18-11 



























































































































































PRU, SEND 
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18-9 



























































route output 











































































































































































































































































































) sosend mbuf 20-6 


























































































































































































































RTM_ADD ( 

















































































































raw_input 


00000 









rtm_addrs 0x07 


rt msghdr() 


IE 
= = 
EI ES] 





DO O IPD] O 
sockaddr_in() 











DO O TP] O 
sockaddr in() 










(0000 
sockaddr_in{} 














rt addrinfo() 


0x07 










[] rtm_addrs H D Ü 
NULL OO r_adarsO D 0 D] 
NULL 


NULL 
NULL 
NULL 









0206 0000000 asma» [00000000 






































route_output 








































































































rt_addrinfo 























































































































RTAX 
° rtm_addrs rt_msghdr 
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0x07 
(U 19-19)[]] RTM ADD 
genmask 
write (sosend ) | mbuf 
sm copydatal| mbuf route output malloc 
mbuf 
*route output rt xaddrs 
rt addrinfo route output 19-19 
rti addrs 
*route output rt msghdr errno 
rtm_errnol]( EEXIST) 
RTF_DONE rtm_flags 
*rt msghdr 0 
m copyback mbuf raw input PCB 
SO USELOOPBACK 




















































































































































































































route 






















































































0 shutdown 









































































































































route output 20-7 
















































































int 

route output () 

L 
R Malloc() to allocate buffer; 
m copydata() to copy from mbuf chain into buffer; 
rt xaddrs() to build rt addrinfo(); 


switch (message type) { 

case RTM ADD: 
rtrequest(RTM ADD); 
rt setmetrics(); 
break; 


case RTM DELETE: 


rtrequest(RTM DELETE); 
break; 


case RTM GET: 

case RTM CHANGE: 

case RTM LOCK: 
rtallocl(); 


switch (message type) ( 
case RTM GET: 
rt msg2 (RTM GET); 
break; 


case RTM CHANGE: 
[] 20-7 route output [00000 
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change appropriate fields; 
/* fall through */ 


case RTM LOCK: 
set rmx locks; 
break; 


} 
break; 


} 
set rtm_error if error, else set RTF DONE flag; 


m_copyback() to copy from buffer into mbuf chain; 
















































































raw input (); /* mbuf chain to appropriate processes +/ 
3 
[] 20-7 (0) 
route output 20-8 
I rtsock.c 
. 113 int 


114 route, output (m, so) 
115 struct mbuf *m; 
116 struct socket *so; 


117 ( 

118 struct rt_msghdr *rtm = 0; 

119 struct rtentry *rt = 0; 

120 struct rtentry *saved_nrt = 0; 

121 struct rt_addrinfo info; 

122 int len, error = 0; 

123 struct ifnet *ifp = 0; 

124 struct ifaddr *ifa = 0; 

125 #define senderr(e) { error = e; goto flush;) 
126 if (m == Il ((m-»m len < sizeof(long)) && 
127 (m = m_pullup(m, sizeof(long))) == 0)) 
‘128 return (ENOBUFS) ; 

129 if ((m->m_flags & M_PKTHDR) == 0) 

130 panic("route output"); 

131 len - m-»m pkthdr.len; 

132 if (len < sizeof(*rtm) || 

133 len != mtod(m, struct rt msghdr *)-»rtm msglen) ( 
134 dst - 0; 

135 senderr (EINVAL) ; 

136 } 

137 R_Malloc (rtm, struct rt msghdr +, len); 

138 if (rtm == 0) ( 

139 dst = 0; 

140 senderr (ENOBUFS) ; 

141 } 

142 m_copydata(m, 0, len, (caddr_t) rtm); 

143 if (rtm->rtm version != RTM_VERSION) { 

144 dst = 0; 

145 senderr (EPROTONOSUPPORT) ; 

146 } 

147 rtm->rtm pid = curproc-»p pid; 

148 info.rti_addrs = rtm->rtm_addrs; 

149 rt, xaddrs((caddr t) (rtm + 1), len + (caddr t) rtm, &info); 


0 20-8 route output D 0 0 0 0 D 0 0 0 0 mbufll D 0 0 0 U 
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150 if (dst == 0) 
151 senderr (EINVAL) ; 
152 if (genmask) { 
153 struct radix_node *t; 
154 t = rn_addmask((caddr_t) genmask, 1, 2); . 
155 if (t && Bcmp(genmask, t->rn key, *(u char zi genmask) == 0) 
156 genmask = (struct sockaddr *) (t->rn_key); 
157 else 
158 senderr (ENOBUFS) ; 
159 } = rtsock.c 
O 20-8 (0) 
1. mbu 
113-136 mbuf rt_msghdr mbuf 
rtm_msglen 
2; 
137-142 m_copydata mbu 
3. 
143-146 
147-149 ID rtm_pid 
info.rti_addrs rt xaddrs([] JO info 8 
4. 
150-151 info.rti info[RTAX DST] 
EINVAL dst (U 19-19) 
5: genmask 
152-159 genmask RTF_CLONING (O 19-8) 
rn_addmask 
genmask 
genmask 
20-9 route_output RTM_ADD[] RTM DELETE 
162-163 RTM ADD 
164-165 rtrequest netmask 
OK saved nrt 
166-172 rt_metrics 1 
genmask ( ) 
173-176 RTM_DELETE rtrequest 
O[] rtrequest rtfree 
([] 19-7) 
20-10 RTM GET|| RTM CHANGE|| RTM LOCK 
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: rtsock.c 
160 switch (rtm->rtm_type) { 
161 case RTM_ADD: 
162 if (gate == 0) 
163 senderr (EINVAL); 
164 error = rtrequest (RTM_ADD, dst, gate, netmask, 
165 rtm->rtm flags, &saved nrt); 
166 if (error == 0 && saved nrt) ( 
167 rt_setmetrics (rtm->rtm_inits, 
168 &rtm->rtm rmx, &saved nrt->rt rmx); 
169 saved nrt->rt refcnt--; 
170 saved nrt->rt genmask = genmask; 
171 } 
172 break; 
173 case RTM_DELETE: 
174 error = rtrequest (RTM_DELETE, dst, gate, netmask, 
175 rtm->rtm flags, (struct rtentry **) 0); 
176 break; 
rtsock.c 
[] 20-9 route output [| [| [| [| [| RIM ADD [| RIM DELETE [] [] 
rtsock.c 
177 case RTM GET: 
178 case RTM CHANGE: 
179 case RTM LOCK: 
180 rt = rtallocl(dst, 0); 
181 if (rt == 0) 
182 senderr (ESRCH) ; 
183 if (rtm->rtm type != RTM GET) { /* XXX: too grotty */ 
184 struct radix node *rn; . 
185 extern struct radix node head *mask rnhead; 
186 if (Bcmp(dst, rt key(rt), dst-»sa len) != 0) 
187 senderr (ESRCH) ; 
188 if (netmask && (rn = rn search(netmask, 
189 . mask rnhead->rnh treetop))) 
190 netmask = (struct sockaddr *) rn->rn key; 
191 for (rn = rt->rt_nodes; rn; rn = rn->rn dupedkey) 
192 if (netmask == (struct sockaddr *) rn->rn mask) 
193 break; 
194 if (rn == 0) 
195 senderr (ETOOMANYREFS) ; 
196 rt = (struct rtentry *) rn; 
197 } 
rtsock.c 
O 20-10 route output [J [| [| RIM GET [] RTM CHANGE [| RMIOK [000000 
6. 
177-182 rtallocl 
ESRCH 
T. 
183-187 RTM CHANGE|| RTM LOCK 
dst 
ESRCH 





















































526 


China-bubcom 























































































































































































































































































































































































































































































































































































































































































































































































































































































































TCP/IP 2 
8. 
188-193 
netmask (mask_rnhead) 
netmask 
rn_mask netmask 
for 
netmask[] rn mask ( 
) netmask 
194-195 for ETOOMANYREFS 
XXX 
rtallocl rtallocl 
RTM_GET 20-11 




















































































































































































































































































































































































































































































































































































































—— m m risock.c 
switch (rtm->rtm_type) { 


198 


199 
200 
201 
202 
203 
204 
205 
206 
207 
208 
209 
210 
211 
212 
213 
214 
215 
216 
217 
218 
219 
220 
221 
222 
223 
224 
225 
226 
227 
228 
229 
230 





case RTM_GET: 


dst = rt_key (rt); 

gate = rt->rt_gateway; 

netmask = rt_mask (rt); 

genmask = rt->rt_genmask; 

if (rtm->rtm_addrs & (RTA_IFP | RTA_IFA)) { 

if (ifp = rt->rt_ifp) (í 

ifpaddr = ifp->if_addrlist->ifa_addr; 
ifaaddr = rt->rt_ifa->ifa_addr;. 
rtm->rtm index = ifp->if_index; 


} else { 
ifpaddr = 0; 
ifaaddr = 0; 
} 


} 
len = rt msg2 (RTM GET, &info, (caddr t) 0, 
(struct walkarg *) 0); 
if (len > rtm->rtm_msglen) { 
struct rt msghdr *new_rtm; 
R_Malloc (new_rtm, struct rt msghdr *, len); 
if (new rtm == 0) i ` 
senderr (ENOBUFS) ; 
Bcopy (rtm, new rtm, rtm-»rtm msglen); 
Free(rtm); : 
rtm = new_rtm; 
} ER 
(void) rt_msg2 (RTM_GET, &info, (caddr_t) rtm, 
i (struct walkarg *) 0); 
rtm->rtm flags = rt->rt flags; 
rtm->rtm_rmx = rt->rt_rmx; 
rtm->rtm_addrs = info.rti_addrs; 
break; ; 


ri 


rtsock.c 





0 20-11 route output [] 00 RMceT [000 
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route_output 
































































































































































































































































































































20-6 m_copydata 








































































































198-203 rti_info dst|| gatel netmask|| genmask 































































































































































































info 





























10. 
204-213 rtm_flags RTA IFP[| RTA IFA 
ifaddr 
(U rt_ifp->addrlist ) (| rt_ifa->ifa_addr ) 










































































































































































































































































































































































































































































214-224 rt msg2 RTM GET info 




















































































































































































































rtm 




































































































































































225-230 rt msg2 

















































































































rt msghdr[]|[] 

20-12 RTM CHANGE|[| RTM LOCK 
12. 

231-233 gate rt_setgate 
13. 

234-244 ( ) rt_ifp[] rt ifa 

ifpaddr ifaaddr | 






























































































































































































































































































































































































































































































































































































































































rt_ifpl] rt ifa 











14. 
245-256 (ifa ) rt_ifa 
rt ifpl| rt ifa 






































































































































































































































































































































































































































































































































































































































15. 
257-258 rt setmetrics 
16. 
259=260 RTM ADD 
17. 
261-262 genmask 20-8 













































































































































































































































































































































































rt genmask 
18. 
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266-270 RTM_LOCK rt_rmx.rmx_locks 20-13 
rtsock.c 
231 case RTM_CHANGE: 
232 if (gate && rt_setgate(rt, rt_key(rt), gate)) 
233 senderr (EDQUOT) ; 
234 /* new gateway could require new ifaddr, ifp; flags may also be 
235 different; ifp may be specified by 11 sockaddr when protocol 
236 address is ambiguous */ 
237 if (ifpaddr && (ifa = ifa_ifwithnet (ifpaddr)) && 
238 (ifp = ifa->ifa_ifp) ) 
239 ifa = ifaof_ifpforaddr(ifaaddr ? ifaaddr : gate, 
240 ifp); : 
241 else if ((ifaaddr && (ifa = ifa ifwithaddr(ifaaddr))) |l. 
242 (ifa - ifa ifwithroute(rt-»rt flags, 
243 rt key(rt), gate))) 
244 ifp - ifa-»ifa ifp; 
245 if (ifa) { 
246 struct ifaddr *oifa - rt-»rt ifa; 
247 if (oifa !- ifa) ( : 
248 if (oifa && oifa->ifa rtrequest)- 
249 oifa->ifa_rtrequest (RTM DELETE, 
250 rt, gate); 
251 IFAFREE(rt-»rt ifa); 
. 252 rt-»rt ifa - ifa; 
253 ifa->ifa_refcnt++; 
254 rt->rt_ifp = ifp; 
255 } 
256 } 
257 rt_setmetrics(rtm->rtm_inits, &rtm->rtm_rmx, 
258 &rt->rt rmx); i 
259 if (rt-»rt ifa && rt->rt_ifa->ifa_rtrequest) 
260 rt-»rt ifa-»ifa rtrequest(RTM ADD, rt, gate); 
261 if (genmask) 
262 rt-»rt genmask - genmask; 
263 /* 
264 * Fall into 
265 */ 
266 case RTM LOCK: 
267 rt-»rt rmx.rmx locks &= ^(rtm-»rtm inits); 
268 rt-»rt rmx.rmx locks |- å 
269 (rtm-»rtm inits & rtm->rtm rmx.rmx locks); 
270 break; 
271 } 
272 break; 
273 default: 
274 senderr (EOPNOTSUPP) ; 
275 } 
rtsock.c 
0 20-12 route output [D [| [| RIM CHANGE [| RIMICK OOOO 
rt metrics rmx_locks 
rmx_locks 
TCP 27-3 rmx pksent 
rtm inits 
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U U U [] U 
RTV MTU 0x01 0000000 ms mtu 
RTV_HOPCOUNT 0x02 0000000 rmx. hopcount 
RTV EXPIRE 0x04 0000000 rmx expire 
RTV_RPIPE 0x08 0000000 rmx_recvpipe 
RTV_SPIPE 0x10 000000 0 rmx. sendpipe 
RTV_SSTHRESH 0x20 0000000 rmx ssthresh 
RTV_RTT 0x40 0000000 rmx_rtt 
RTV_RTTVAR 0x80 0000000 ms rttvar 
020-13 [D [I BO U B D UE U U U LI I 

rt setmetrics rtm rmx.rmx locks 

rt rmx.rmx locksl] 

















































































































































































































































































































































































































































































































































































































































































































(rtm inits) 
(rtm inits) (rtm rmx.rmx locks) 
273-275 default 20-9 switch 
route output 20-14 raw input[] 
rtsock.c 
276 flush: 
277 if (rtm) { 
278 if (error) 
279 rtm->rtm_errno = error; 
280 else 
281 rtm->rtm_flags |= RTF_DONE; 
282 } 
283 if (rt) 
284 rtfree (rt); 
285 { 
286 struct rawcb *rp = 0; 
287 /* 
288 * Check to see if we don't want our own messages. 
289 */ 
290 if ((so->so_options £ SO_USELOOPBACK) == 0) 1 
291 if (route cb.any count <= 1) { 
292 if (rtm) 
293 Free(rtm); 
294 m freem(m); 
295 i return (error); 
296 } 
297 /* There is another listener, so construct message */ 
298 rp = sotorawcb (so); 
299 } 
300 if (rtm) { 
301 m_copyback (m, 0, rtm->rtm_msglen, (caddr_t) rtm); 
302 Free (rtm); 
303 } 
304 if (rp) ; 
305 rp->rcb_proto.sp_family = 0; /* Avoid us */ 
306 if (dst) 
307 route_proto.sp_protocol = dst->sa family; 
308 raw_input (m, &route_proto, &route_src, &route_dst); 


O 20-14 route output 2000000000 raw input 


530 


























































































































Chinaspub.tol 



































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































TCP/IP 2 
309 if (rp) I 
310 rp->rcb_proto.sp_family = PF ROUTE; 
311 } 
312 return (error); 
ed rtsock.c 
0 20-14 (D) 
19. OK 
276-282 flush senderr 
| rtm_errno RTF_DONE | 
20. 
283-284 20-10 rtallocl 
21. 
285-296 SO_USELOOPBACK|] 
( RTM GET 
) 1 
mbuf 
22. 
297-299 rp 
23. mbu 
300-303 mbuf[] (U) 20-6) 
24. 
304-305 rp 
sp_family 0 sp_family(route_proto 
19-26[] ) PF_ROUTE raw_input 
raw_input sp family[] 0 
25. | 
306-308 dst 
Internet PF INET raw input 
309-313 sp family 0 PF ROUTE 
20.6 rt xaddrs[l |] 
mbuf 
(rtm addrs) rt addrinfo rti info route output 
rt xaddrs (O 20-8)[] rt. xaddrs 
rti info 20-15 
330-340 0 
341-347 8[] (RTM. MAX) ( ) 
| | rti info ADVANCE sa len 



















































































































































































China=pub.tom 0 531 







































































































































































4 cp 
S — rtsock.c 

330 #define ROUNDUP (a) \ 
331 (fa) > 0 ? (1 + (((a) - 1) | (sizeof(long) - 1))) : sizeof(long)) 
332 #define ADVANCE(x, n) (x += ROUNDUP( (n)-»sa, len)) 
333 static void 
334 rt xaddrs(cp, cplim, rtinfo) 
335 caddr t cp, cplim; 
336 struct rt addrinfo *rtinfo; 
337 ( 
338 struct sockaddr *sa; 
339 int i: 
340 bzero(rtinfo-»rti info, sizeof (rtinfo->rti_info)); 
341 for (i = 0; (i < RTAX MAX) && (cp < cplim); i++) ( 
342 if ((rtinfo-»rti addrs & (1 << i)) == 0) 
343 continue; 
344 rtinfo-»rti info[i] - sa - (struct sockaddr *) cp; 
345 ADVANCE(cp, sa); 
346 } 
= risock.c 


[] 20-15 rt_xaddrs [000000 vi info [J 


20.7 rt, setmetrics[]|[] 

















































































































route output 















































rtm inits rtm rmx 


20-13 




































































































































































rtm addrs 

































































rt metrics 





























































































































































































































































































































































































































rt msghdr —— || rtm inits 
20-16 rt setmetrics 

314 void roche 

315 rt setmetrics(which, in, out) 

316 u long which; 

317 struct rt, metrics *in, *out; 

/ 318 ( 

319 #define metric(f, e) if (which & (f)) out->e = in-»e; 

320 metric(RTV RPIPE, rmx recvpipe); 

321 metric(RTV SPIPE, rmx sendpipe); 

322 metric(RTV SSTHRESH, rmx ssthresh); 

323 metric(RTV RTT, rmx rtt); 

324 metric(RTV RTTVAR, rmx rttvar); 

325 metric(RTV HOPCOUNT, rmx hopcount); 

326 metric(RTV MTU, rmx mtu); 

327 metric(RTV EXPIRE, rmx expire); 

328 #undef metric 

329 ) . 
rtsock.c 





D 20-16 rt setmetrics 00000 rt metrics 000000 


532 
































China-pubscon 






























































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































TCP/IP 2 
314-318 which rtm_inits in FE 
metrics out rt metrics 
3419-329 8 
RTM ADD route output rtrequest 
oU 19-9) 0 
20.8 raw input[|[] 
raw input 18-11 raw input 
PF ROUTE socket 0 
AF INET 
(20.3[] ) 
rcb proto Sp family|| sp protocol 
20-17 raw input 
51 void raw usrreg.c 
52 raw input (m0, proto, src, dst) 
53 struct mbuf *m0; 
54 struct sockproto *proto; 
55 struct sockaddr *src, *dst; 
56 ( 
57 struct rawcb *rp; 
58 struct mbuf *m = m0; 
59 int Sockets - 0; 
60 struct socket *last; 
61 last = 0; 
62 for (rp = rawcb.rcb next; rp !- &rawcb; rp = rp-»rcb next) ( 
63 if (rp-»rcb proto.sp family !- proto-»sp. family) 
64 continue; 
65 if (rp-»rcb proto.sp protocol && 
66 rp-»rcb proto.sp protocol !- proto-»sp protocol) 
67 continue; 
68 FE 
69 * We assume the lower level routines have 
70 * placed the address in a canonical format 
71 * suitable for a structure comparison. 
72 * 
73 * Note that if the lengths are not the same 
74 * the comparison will fail at the first byte. 
75 x: 
76 #define equal (al, a2) N 
77. (bcmp((caddr t) (al), (caddr t)(a2), al->sa len) == 0) 
78 if (rp->rcb laddr && !equal(rp->rcb_laddr, dst)) 
79 continue; 
80 if (rp->rcb faddr && !equal(rp->rcb faddr, src)) 
81 continue; 
82 if (last) { 
83 struct mbuf *n; 
84 if (n = m_copy(m, 0, (int) M COPYALL)) { 
85 if (sbappendadär (&last->so_rcv, src, 
86 n, (struct mbuf *) 0) == 0) 


0 20-17 raw input U UU 0 0 0 0 0 0 0 0 00 0 0 0 0 0 
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87 /* should notify about lost packet */- 
88 m_freem(n); 

89 else { 

90 sorwakeup (last); 

91 sockets++; 


94 ) 

95 last = rp-»rcb socket; 

96 } 

97 if (last) { 

98 if (sbappendaddr(&last-»so rcv, src, 

99 m, (struct mbuf *) 0) == 0) 
100 m freem(m); 
101 eise ( 
102 sorwakeup (last); 
103 sockets++; 

104 } 
105 } else 
106 m_freem(m); 
107 } : 


— — él. m yaw usrreq.c 


U 20-17 (0) 





































































































51-61 raw_input proto|| srcl| dst 










































































route protol] route src[| route dst 19-26 
































































































































1. 
62-67 for ( PF ROUTE) 























































































































































































































sockproto 













































































































































































(socket ) sockproto 
0 




























































































































































































2. 
68-81 






























































































































































rcb_laddr rcb_faddr bind 

















































































































connect Net/3 









































































































































































































































































































































route_usrreg route_src 







































































src 







































































82-107 last socket 








































































































































































































m copyl| sbappendaddr 

































































































































































last 
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m copy( ) 


















































N- 1 










































































socket 





























































































































































































































































































































































































































534 TCP/IP 2 


) 























































































































20.9 route usrreq[]|[] 


China-pubecom 



















































































route usrreq 
































20-18 





































































































TAA TCO rsockc 


64 int 
65 route usrreq(so, req, m, nam, control) 
66 struct socket *so; 


få 


67 int reg; 

68 struct mbuf *m, *nam, *control; 

69 ( 

70 int error = 0; i 
71 struct rawcb *rp = sotorawcb (so); 

72 int S; 

73 if (req == PRU ATTACH) { 

74 MALLOC (rp, struct rawcb *, sizeof(*rp), M PCB, M_WAITOK); 
75 if (so->so_pcb = (caddr t) rp) ` 
76 bzero(so->so pcb, sizeof(*rp)): 

77 . ) 

78 if (req == PRU DETACH && rp) { 

79 int af = rp->reb proto.sp protocol; 
80 if (af == AF INET) 

81 route cb.ip count--; 

82° else if (af == AF_NS) 

83 route_cb.ns_count--; 

84 else if (af == AF_ISO) 

85 route_cb.iso_count--; 

86 route_cb.any_count--; 

87 } 

88 S = splnet (1: 

89 error = raw usrreq(so, req, m, nam, 

90 rp = sotorawcb (so); 

91 . if (req == PRU_ATTACH && rp) ( 

92 int af - rp-»rcb proto.sp protocol; 
93 if (error) ( 

94. free((caddr t) rp, M PCB); 

95 splx(s); 

96 return (error); 

97 } 

98 if (af == AF_INET) 

99 route_cb.ip_count++; 
100 else if (af == AF_NS) 
101 route_cb.ns_count++; 
102 ~ else if (af == AF ISO) 
103 route_cb.iso_count++; 
104 ^ route cb.any.count++; 

105 rp-»rcb faddr = &route src; 

106 soisconnected(so); 

107 so->so options |= SO USELOOPBACK; 

108 } 

109 splx(s); 

110 return (error); 

111 3 





rtsock.c 


O 20-18 route usrreq 00000 PRI xxx] 0 
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1. PRU_ATTACH 
64-77 socket PRU_ATTACH 
MALLOC socket so_pcb | rawcb 
0 
2. PRU_DETACH 
78-87 close PRU_DETACH socket 
route_cb 1 any_count 
| 
3. 
88-90 raw usrreq PRU. xxx 
4. 
91-104 PRU ATTACH 
raw usrreq route cb 
any count 
5. 
105-106 route_src 
[| PF_ROUTE 
6. SO_USELOOPBACK 
107-111 SO_USELOOPBACK — 



































































































































































































































20.10 raw usrreq]| || 








































































































raw usrreq 






























































































































































route usrreq 


















































( OSI CLNP) raw usrreq route usrreql]| raw usrreq 



































pr usrreq 





























pr usrreq | 






























































































































































20-19 raw usrreq switch 



























































































































































































































































































































































































































































































































































































































































1. PRU. CONTROL 
119-129 PRU CONTROL ioctl 

2. 
130-133 ( sendmsg ) 

3. 
134-137 socket 

(U route usrreqg) 
so pcb 


























































































































262-269 | switch default|] | [] casel UDE | | PRU BIND 







































































536 em n: China=pub.tom 
ET HD 










































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































PRU CONNECT Net/3 
bind[] connect (panic) 
(bug) 
Tat HS C 
119 int METTE 
120 raw usrreq(so, req, m, nam, control) 
121 struct socket *so; 
122 int req; 
123 struct mbuf *m, *nam, *control; 
124 ( 
125 f struct rawcb *rp = sotorawcb(so); 
126 int error = 0; 
127 int len; 
128 if (req == PRU CONTROL) 
129 return (EOPNOTSUPP) ; 
130 if (control && control->m_len) ( 
131 error = EOPNOTSUPP; 
132 ' goto release; 
133 } 
134 if (rp == 0) L 
135 error = EINVAL; 
136 i goto release; 
137 } 
138 switch (req) { 
262 default: 
263 panic ("raw_usrreq"); 
264 } 
265 release: 
266 if (m != NULL) 
267 m freem (m); 
268 return (error); 
269 ) 
raw usrreq.c 
O 20-19 raw usrreg [OQ 
case 20-20 PRU ATTACH[] PRU. DETACH 
139-148 PRU ATTACH Socket 
149-150 raw attach([]| 20-24) nam 
Socket 
151-159 PRU DETACH close rp 
switch 
160-161 raw detach([] 20-25) 
20-21 PRU CONNECTO[] PRU. DISCONNECT[] PRU. SHUTDOWN 
186-188 PRU CONNECT2 Socketpair 
189-196 20-18) PRU DISCONNECT PRU. DETACH 
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139 Tx raw usrreg.c 
140 * Allocate a raw control block and fill in the 
141 * necessary info to allow packets to be routed to 
142 * the appropriate raw interface routine. 
143 */ 
144 case PRU_ATTACH: 
145 if ((so->so state £ SS_PRIV) == 0) { 
146 error = EACCES; ` 
147 break; 
148 } 
149 error = raw attach(so, (int) nam); 
150 break; 
151 /* 
152 * Destroy state just before socket deallocation. 
153 * Flush data or not depending on the options. 
154 X 
155 case PRU. DETACH: 
156 if (rp == 0) I 
157 error = ENOTCONN; 
158 break; 
159 } 
160 raw detach(rp); 
161 break; 
raw. usrreg.c 
[ 20-20 raw usrreq [][][] PRU ATTACH [| PRU DETACH [|] [] 
close 
raw disconnect|| soisdisconnected 
197-202 shutdown 
PRU. SHUTDOWN Socantsendmore 

186 case PRU, CONNECT2: BEES 
187 i error = EOPNOTSUPP; 
188 goto release; 
189 case PRU_DISCONNECT: 
190 if (rp->rcb faddr == 0) { 
191 error = ENOTCONN; 
192 break; 
193 } 
194 raw disconnect (rp); 
195 soisdisconnected (so); 
196 break; 
197 /* 
198 * Mark the connection as being incapable of further input. 
199 */ ' ES 
200 case PRU SHUTDOWN: 
201 socantsendmore (so); by 
202 break; u 








[ 20-21 raw usrreq [] U [ PRU_CONNECT2 [] PRU DISCONNECT [|] PRU SHUIDOWN [] [] 









































PRU_ABORT|| PRU. SENSE 20-22 











FU 
0 
Gq 
un 
Ei 
= 
el 














































































































































































































203-217 sosend PRU SEND nam 
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TCP/IP 2 
raw_usrreq.c 
203 {* à 
204 * Ship a packet out. The appropriate raw output 
205 * routine handles any massaging necessary... 
206 */ 
207 case PRU SEND: 
208 if (nam) { 
209 if (rp-»rcb faddr) { 
210 error = EISCONN; 
211 break; 
212 } 
213 rp->rcb_faddr = mtod(nam, struct sockaddr *); 
214 } else if (rp-»rcb faddr == 0) í 
215 error = ENOTCONN; 
216 break; 
217 ) 
218 error = (*so-»so proto-»pr output) (m, so); 
219 m - NULL; 
220 if (nam) 
221 rp-»rcb faddr - 0; 
222 break; 
223 case PRU, ABORT: 
224 raw disconnect (rp); 
225 sofree(so); 
226 Soisdisconnected(so); 
227 break; 
228 case PRU SENSE: 
229 /* 
230 * stat: don't bother with a blocksize. 
231 */ 
232 return (0); 
: raw_usrreq.c 
0 20-22 raw usrreq [] [| [| PRU SEND [| PRU ABORT [| PRU SENSE [| [| 
sendto sendmsg 
route usrreg rcb faddr 
218-222 m mbuf pr_output 
route_output 
223-227 PRU_ABORT 
228-232 fstat | PRU SENSE OK] 
20-23 PRU xxx 
raw usrreg.c 
233 /* 
234 * Not supported. 
235 */ 
236 case PRU RCVOOB: 
237 case PRU_RCVD: 
238 return (EOPNOTSUPP) ; 
239 case PRU LISTEN: 
240 case PRU, ACCEPT: 
241 case PRU_SENDOOB: 
242 error = EOPNOTSUPP; 
U 20-23 raw usrreq [000000 
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243 break; 
244 case PRU_SOCKADDR: 
245 if (rp->rcb laddr == 0) { 
246 error = EINVAL; 
247 break; 
248 } 
249 len = rp-»rcb laddr->sa: len; 
250 bcopy ((caddr_t) rp->rcb_laddr, mtod(nam, caddr t), (unsigned) len); 
251 nam->m len = len; 
252 break; 
253 case PRU PEERADDR: 
254 if (rp->rcb faddr == 0) { 
255 error = ENOTCONN; 
256 break; 
257 1 
258 len = rp->rcb_faddr->sa_len; 
259 bcopy((caddr t) rp->rcb_faddr, mtod(nam, caddr_t), (unsigned) len); 
260 nam->m_len = len; 
261 break; 
raw_usrreg.c 
U 20-23 (0) 
233-243 
244-261 PRU SOCKADDR|| PRU PEERADDR getsockname|| getpeername 
bind| 
route src route usrreq 
20.11 raw attach[| raw detach[] raw_disconnect|]| |] 
raw attach 20-24 raw input PRU ATTACH 
Ea raw_cb.c 
50 raw_attach(so, proto) 
51 struct socket *so; 
52 int proto; 
53 ( 
54 struct rawcb *rp = sotorawcb(so); 
55 int error; 
56 /* 
57 * It is assumed that raw attach is called 
58 * after space has been allocated for the 
59 * rawcb. L 
60 */ 
61 if (rp == 0) 
62 return (ENOBUFS); 
63 if (error = soreserve(so, raw_sendspace, raw_recvspace)) 
64 i return (error); 
65 rp->rcb socket = so; 
66 rp-»rcb proto.sp family = so-»so proto-»pr. domain-»dom family; 
67 rp-»rcb proto.sp protocol - proto; 
68 insque(rp, &rawcb); 
69 return (0); 
70:3 


= ee chic 
O 20-24 raw attach 00 


5 40 TCP/IP 2 
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49-64 soreserve 
8192 
65-67 socket dom_family( 20-1[] PF ROUTE) 
protol] [| (socket ) 
68-70 insque rawcb 
raw_detach 20-25 raw_input PRU_DETACH 
- raw cb.c 
75 void 
76 raw detach(rp) 
77! struct rawcb *rp; 
78 I 
79 struct socket *so = rp-»rcb socket; 
80 so->so_pcb = 0; 
81 sofree (so); 
82 remque (rp); 
83 free((caddr t) (rp), M PCB); 
84 ) I 
raw che 
O 20-25 raw detach |] [J 
75-84 socket] |] so pcb | | remquel]|[|] 
free 
raw_disconnect 20-26 raw_input PRU 
DISCONNECT|| PRU ABORT 
88-94 raw detach 
raw cb.c 
88 void 
89 raw disconnect (rp) 
90 struct rawcb *rp; 
91 ( 
92 if (rp-»rcb socket->so state & SS NOFDREF) 
93 raw detachirp): í 
94 } 
raw_cb.c 
[] 20-26 raw disconnect [0 
20.12 00 
PF_ROUTE 
sysctl 
( ) 
(PCB) 
rawcb 22 
UDP[] TCP IP Internet (inpcb) 
socket PCB rawcb inpcb 
socket PCB 
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route output |] 000000000000000000000000 raw input[] 
LU LU U U U U U U U U U U U U U DU 0 0 0 U LU U U U 0 U PRU xxx[] l] [] 
raw usrreq[] route usrreg U 000090 000000 xxx usrreq[] 
000000 (UDPU TCP[] POIOOOOOODO l] switch[] O 00000 
U U U U U L 
U U 

20.1 OU UUUUUUUUU L U U) U L U route output[] [] 

OU 000000 
20.2 [ [| routesw[] [| O pr_protocol| og 00 [] socket[] | g 






















































































O[] protocoll 0000 U! 
20.3 | U (U ARPIEI U 0 10 D U 0 D] U U O U UD 0 0 D D D D U 












































































































































D 2 








10 ARPQODOoODDO 



































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































21.1 HH 
(ARP) IP 
48 bit[] ARP 
IP 48 bit ARP[] RFC 826[] Plummer 1982] 
IP IP ARP 
ARD IP 
ARP IP 
ARP IP 
ARP Net/3 ARP 
1 4 ARP 
21.2 ARPIT [| [| Ú 
Net/3[] ARP 
ARP 21-1 ARP 
bsdi ARP Ifnet 
ifaddr|] in ifaddr 3-32 6-5 3 6 
ifaddr 
sockaddr dl — 
in_ifaddr 
1) llinfo_arp ARP 
llinfo_arp la_prev 
la_next ARP 5 
2) IP (rtentry )] 11info arp 
la rt rtentry rtentry 
rt llinfo llinfo arp 





svr4(140.252.13.34)[] bs 
18-2 













































































sun(140.252.13.33) 





di(140.252.13.35) 




























































































































































































llinfo arp 














llinfo arp 











(140.252.13.32) 



























































rt 














flags C 




















IP 
































































































































in ifinit ([] 6-19) 

















































































































(H ) bsdi 





















































21 ARP 543 



































































































































































































































































































































































































































































































































































































































































































































































































































sockaddr dl() 





AF LINK 
IFT ETHER 
sdl alen=0 








rtentry{} 


rn_key = 
140.252.13.32 


Kal rt_gateway 
rt_flags UC 


rt ifa 















rmx_expire 





ifnet: 


ifnet_addrs: 








in_ifaddr: 





















ARP (L ) 
4) rtentry rt gateway sockaddr dl 
sdl alen 6 sockaddr dl 
5) rt ifp ifnet 
le softc[0] 
bsdi loif rt ifp.if output 

llinfo arp() llinfo arp() 1linfo_arp{} llinfo_arp{} 
llinfo arp: [la next 
ta prev lu Haprev — | tia prev fa | 






sockaddr dl() 


AF LINK 

IFT ETHER 
sdl alen=6 
0:0:c0:c2:9b:26 


sockaddr dl() 


AF LINK 

IFT ETHER 
sdl alen=6 
0:0:c0:6£:2d:40 


sockaddr dl() 


AF LINK 
IFT ETHER 








sdl alen-6 
8:0:20:3:£6:42 





















rtentry{} 


rn_key = 
140.252.13.35 


un 


rtentry{} rtentry{} 


rn_key = 
140.252.13.33 


rn_key = 
140.252.13.34 


rmx_expire 


= 


\ 





























rmx expire 














loif: 


ifnet{} 
index=3 


sl_softc[0]: 
ifnet {} 
index=2 






le. softc[0] sy 


ifnet() 
index=1 


le_softc{} 


ifaddr() 
AF LINK 
led 
IFT_ETHER 
0:0:c0:6£:2d:4e 














ifaddr{} ifaddr{} 
















in_ifaddr{} 
AF_INET 
140.252.13.66 
140.252.13.65 
255.255.255.224 


in ifaddr() 











in ifaddr() 
AF INET 
140.252.13.35 
140.252.13.63 
255.255.255.224 















021-1 ARPI)O0000000000 





544 


















































China-pubecom 






































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































TCP/IP 2 
6) in_ifaddr (U 6-8 
in_ifaddr ifaddr rt_ifa ifaddr 
) 
led IP IP in_ifaddr 
rt. ifp rt ifa 
7) la hold mbu IP 
ARP ARP mbuf 
la_hold ARP la_hold mbu IP 
8) rt_metric [| rmx_expire ARP E 
( 20 JI] ARP 
4.3BSD Reno 4.3BSD Reno[] Net/2. 
4.4BSD ARP ARP 
ARP 
Net/2 ARP IP 
E E E mbuf ( 21-1 la_hold 
) Net/3 
213 OOOO 
21-2 9[] ARP C 
0 E Ë U 
net/if arp.h arphdr 0000 
netinet/if ether.h 0000000000 
netinet/if ether.d ARP O 
0212 aaa 
21-3 ARP L | | | | | ARPJ [| 190 [| 
21.3.1 | 
| EB LH 10 21-4 
21.3.2 | 
ARP arp. inuse[] arp allocated 21-4 
ARP ARP 
netstat 
arp -a ARP sysctl 
[] 19-36 [] 21-5 
18-2 224.0.0.1 L arp 
RTF LLINFO ARP 
“ incomplete” “ permanent” 
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ifconfig arp 1 | 
0000 
loct1]SIOCAIFADDR 00 
E ern RR RIM ADD | 
Cin ifinit > RTM, DELETE 
RTM GET 

G OODARPIOD OO A 0000 ARP H 

3 O000000 yA 

pio S 

Së Š 

Ee d 

S 

Ed 

000000 0500 

Tue 

E 

EE 

de 

ZI am fot weis 

3x22 e ge 

ar Im TO 










DE Ze 


Ki 


Ra 


000000 


(ether_output) 


Trtinie D O 0 0 RTF. UP[] RTE_CLONING[] [] Citrequest > 


RTM_ADD 
RTM_DELETE 
RTM_RESOLVE 





OO000000000 
ifa rtrequest[][] 


021-3 ARPO OO0O000000000 


































































































0 E U DD D U [] 
llinfo arp struct llinfo arpl linfo_arB 0000000 
arpintrq struct ifqueue 00000000000 ARPI [IU 
arpt prune Int DO ARP D 0 D 0000000 6) 
arpt keep Int ARPIJ0O0O0000000 20) 
arpt down Int ARPD D 0 D D 0 0 DDD DD (0) 
arp inuse Int 00000 ARP D 
arp_allocated | Int 00000 ARPO O O 
arp_maxtries Int OOO (pD 0 0 D ARPD D D 0000 (5) 
arpinit done Int 00000 
uselookback int 2000000400) 

0214 9200000000 


















































546 TCP/IP 2 China+pub.tom 
A 


bsdi $ arp -a 

sun.tuc.noao.edu (140.252.13.33) at 8:0:20:3:£6:42 
svr4.tuc.noao.edu (140.252.13.34) at 0:0:c0:c2:9b:26 
bsdi.tuc.noao.edu (140.252.13.35) at 0:0:c0:6f:2d:40 permanent 
ALL-SYSTEMS.MCAST.NET (224.0.0.1) at (incomplete) 


021-5 00 18-2000 arp «0000 

























































































































































































































































































































































































































































































































































































































































































































































































































































































21.3.3 SNMP 
1[] 25.8 SNMP MIB 
ARP MIB-II (0 IPD ) 
Net/2[] Net/3 ARP 
ARP O SNMP[] 
IPO OO 00 O index = <ipNetToMedialfIndex>.<ipNetToMediaNetAddress> 
Oo E U U 0 E 
ipNetToMedialfIndex if_ index 00000 ifIndex 
ipNetToMediaPhysAddress rt_gateway Hg 
ipNetToMediaNetAddress rt key IP] O 
ipNetToMediaType rt flags 000001-0002-0003-0004-0 0000) 
O 21-6 IPO [| O O O 0 ipNetToMediaTable 
21-6 MIB-II IP ipNetToMediaTable 
ifnet 
i |] 0 
21.4 ARP [] |] 
| ARP 21-7[] | 








































































































00000 ar hrå (ARPHRD ETHER) 
00000 ar_pro (ETHERTYPE IP) 


000000 Derin) 
000000 er pin (4) 





ether type 





ether dhost ether shost 


00000 | 0000 ET. 
00 00 
6 2 2 


6 bytes 2 


U U U U ARPÚ O 
ether_header() arphdr() O O 0 ARP O 
ether_arp() 


0217 00000000 ARE) DL D ü D U D 


















































ether header arphdr 50 U 

















































































































ARP ether_arp arphdr 





































































































































































































arphdr 21-8 21-7 4 



























































Chinaepubecom SE 547 












































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































if arp.h 
45 struct arphdr ( f- "p 
46 u_short ar_hrd; /* format of hardware address */ 
47 u_short ar pro; /* format of protocol address */ 
48 u_char ar hin; /* length of hardware address */ 
49 u char ar pln; /* length of prøtocol address */ 
50 u short ar op; /* ARP/RARP operation, Figure 21.15 */ 
51 }; 5 
if_arp.h 
U 21-8 arpher D D 0000 ARPOO /0 0 U D D. U 
21-9 ether arp arphdr 
IP ARP 48 bit 32 bit 
IP 
if_ether.h 
79 struct ether arp { 
80 struct arphdr ea hdr; /* fixed-size header */ 
81 u char arp sha[6]; /* sender hardware address */ 
82 u char arp spa[í4]; /* sender protocol address */ 
83 u_char arp thal6l; /* target hardware address */ 
84 u_char arp_tpal4]; /* target protocol address */ 
85 T: 
86 #define arp_hrd ea_hdr.ar_hrd 
87 #define arp_pro ea_hdr.ar_pro 
88 #define arp hln ea hdr.ar hln 
89 #define arp pln ea hdr.ar pln 
90 #define arp op ea hådr.ar op 
if ether.h 
[] 21-9 ether arp [] Ü 
ARP llinfo_arp 21-10 
ARP 21- 
1 ARP 
: — if ether.h 
103 struct llinfo arp ( 
104 struct llinfo arp “la next; 
105 struct llinfo arp “la prev; 
106 struct rtentry “la rt; 
107 struct mbuf “la hold; /* last packet until resolved/timeout */ 
108 long la asked; /* #times we've queried for this addr */ 
109 }; 
110 #define la timer la rt-»rt rmx.rmx expire /* deletion time in seconds */ 
if ether.h 
[] 21-10 11info. arg O 
Net/2 ARP 
ARP Net/3 ARP 
ARP ARP 
ARP 
104-106 insquel| remque la rt 




































































































































































548 











































































































China-pubecom 




































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































TCP/IP 2 
rt_llinfo la_rt 
107 ARP IP 
ARP ARP la_hold 
la_hold 
108-109 la asked IP! 21-24 
ARP 
110 rt_metrics rmx_expire ARP 
0 ARP | | | 
21.5 arpwhohas[|[] 
arpwhohas arpresolve ARP 21-11 
IP 
(U 6-28 SIOCSIFADDRioctD 
IP arpwhohas 
arprequest 
196 void IRRE 
197 arpwhohas (ac, addr) 





198 struct arpcom *ac; 
199 struct in_addr *addr; 





































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































— i arprequest (ac, &ac->ac ipaddr.s addr, &addr->s_addr, ac->ac enaddr); 
pe if ether.c 
0 21-11 arpwhohas [I DO UD ARPOO 
196-202 arpcom ([] 3-26) le softc (O 3-20) 
ac ipaddr IP SIOCSIFADDRi oct I 
(O 6-28)[] ac enaddr 
addr ARP IP 
addr| ac ipaddr arprequest IP 
IP | 
21.6 arprequest|| |] 
arprequest arpwhohas ARPI] 
ARP 
ARP 
ether output[| ether output mbuf 
21-7 
IP ( 21-3 ip output 
ether output) sa family AF UNSPEC 
ether output 
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ether output arpreslove 21-3 
arprequest ether output ether output 
arpresolve 

21-12 mbuf[] sockaddr 

eh) ea 











































i 
EAS 00000 


on 1 100 
A 


m_type 


sockaddr () mbuf {} 
re el mnet (NULL 
l m 
m 


MT_DATA 
M_PKTHDR 
28 


m pkthdr.len 






















































































[m pkthår .revif [NULL 
OOO 
(720 0) 
ea — 
ether arp() 
(2800) 
0 21-12 arprequest [] [| [] sockaddr [| mbuf 
21-13 arprequest 
if ether.c 


209 static void 

210 arprequest (ac, sip, tip, enaddr) 
211 struct arpcom *ac; 

212 u long *sip, *tip; 

213 u char *enaddr; 


214 { 

215 struct mbuf *m; 

216 struct ether header *eh; 

217 struct ether arp *ea; 

218 struct sockaddr sa; 

219 if ((m = m_gethdr (M_DONTWAIT, MT DATA)) == NULL) 
220 return; 

221 m->m len = sizeof(*ea); 

222 m-»m pkthdr.len = sizeof(*ea); 

223 MH ALIGN(m, sizeof(*ea)); 

224 ea = mtod(m, struct ether arp *); 

225 eh - (struct ether header *) sa.sa data; 

226 bzero((caddr t) ea, sizeof(*ea)); 

227 bcopy((caddr t) etherbroadcastaddr, (caddr t) eh->ether dhost, 
228 sizeof (eh->ether_dhost)); 


0 21-13 arprequest [000000 ARP 0 0 0 Ú 


550 





TCP/IP 











China-pubecom 



































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































229 eh->ether_type = ETHERTYPE_ARP; /* if output () will swap */ 
230 ea->arp_hrd = htons (ARPHRD_ETHER); 
231 ea->arp_pro = htons (ETHERTYPE_IP); 
232 ea->arp_hln = sizeof(ea->arp_sha); /* hardware address length */ 
233 ea->arp_pln = sizeof(ea->arp spa); /* protocol address length */ 
234 ea->arp_op = htons (ARPOP REQUEST); 
235 bcopy((caddr t) enaddr, (caddr t) ea->arp sha, sizeof(ea-»arp sha)); 
236 bcopy ((caddr_t) sip, (caddr t) ea->arp spa, sizeof(ea->arp_spa)); 
237 bcopy((caddr t) tip, (caddr t) ea-»arp tpa, sizeof(ea-»arp tpa)); 
238 Sa.sa family - AF UNSPEC; 
239 sa.sa len = sizeof (sa); 
240 (*ac->ac if.if output) (&ac->ac if, m, &sa, (struct rtentry *) 0); 
241 ) : 
if ether.c 
D 21-13 (0) 
1. mbuf 
209-223 mbu MH ALIGN[] 28 
ether arp mbu m data mbuf 
ether output 14 mbu 
2. 
224-226 ea[] eh ether arp O[] bzero 
0 8 
3. 
227-229 ETHERTYPE ARP 
21-14 
Ë Ë [] [] [] 
ETHERTYPE IP 0x0800 IP[] 
ETHERTYPE ARP 0x0806 ARP 
ETHERTYPE REVARP 0x8035 [ ARPO 
ETHERTYPE IPTRAILERS | 0x1000 0000000) 
0 21-14 00000000 
RARP IP RARP 
TCP/IP 1 5 RARP 
4. ARP 
230-237 ether_arp ARP 
ARPHRD_ETHER 1 6 
4 IP arp pro 21-14 IP (0x800) 21-15 
ARP RARP 
5. sockaddr 
238-241 sa family AP UNSPEC|| sa member 
16 ether output 



















































































Chinaspubecom me 551 




































































0 E U U [] 
ARPOP REQUEST 1 U U 00000 ARPO O 
ARPOP REPLY 2 0 0 ARPOO 
ARPOP_REVREQUEST 3 0000000 RARPO O 
ARPOP_REVREPLY 4 OO RARPO O 

















0 21-15 ARPI DD 


21.7 arpintr|] |] 































































































































































































































































































































































































4-13 ether_input ETHERTYPE_ARP 
NETISR_ARP ARP arpintrq 
arpintr 21-16 

— if ether.c 
319 void 
320 arpintr() 
321 I 
322 struct mbuf *m; 
323 struct arphdr *ar; 
324 int s; 
325 while (arpintrq.ifq head) ( 
326 s = splimp(); 
327 IF_DEQUEUE (karpintrg, m); 
328 splx(s); 
329 if (m == 0 |! (m->m_flags & M_PKTHDR) == 0) 
330 panic("arpintr"); 
331 if (m->m_len >= sizeof(struct arphdr) && 
332 (ar = mtod(m, struct arphdr *)) && 
333 ntohs (ar->ar_hrd) == ARPHRD_ETHER && 
334 m-»m len >= sizeof (struct arphdr) + 2*ar-»ar hln + 2*ar->ar_pln) 
335 switch (ntohs (ar->ar_pro)) { 
336 case ETHERTYPE_IP: 
337 case ETHERTYPE_IPTRAILERS: 
338 in arpinput (m); 
339 continue; 
340 } 
341 m_freem(m); 
342 } 
343 } 

if_ether.c 








O 21-16 arpintr 0002020000 ARP) D 0 DTD D. 0 0 0 






































319-343 while 





















































































































































arphdr 
























































ETHERTYPE IP 









































































































































ETHERTYPE_IPTRAILERS in_arpinput 

















































































































































































































































































































arphdr[] o 0 arphdr 





















































































































































552 TCP/IP 2 China-bubucom 
iene 


21.8 in arpinput[] [| 























































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































arpintr ARP / ARP 
1) IP 
ARP ARP IP 
2) ARP ARP 
sockaddr_dl 
ARP 
arprequest ARP 
IP 
3) ARP IP 
Net/3 ( 
in arpinout ARP 
4) ARP 
ARP 
ARP 
ARP 
5). ARP ARP 
ARP 
IP ARP 10 4.6 ARP 
Net/3 ARP ARP arp 
IP pub 21-20 21-12 
in_arpinput 21-17 
358-375 ether_arp (arp_intr ) ea 
ARP ( ) op 
IP isaddr[] itaddr 
1. IP 
376-382 Internet (in_ifaddr 6-5) 
IP ifnet OT mbuf 
)] for IP IP IP 
IP 
383-384 maybe_ia 0 IP 
out([] 21-19) mbu 
ARP IP 
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IP IP myaddr IP 
( JO myaddr IP IP 

















































































































































































































- - if_ether.c 
358 static void 


359 in_arpinput (m) 
360 struct mbuf *m; 









































































































































361 { 
362 struct ether_arp *ea; 
363 struct arpcom *ac = (struct arpcom *) m->m_pkthdr.rcvif; 
364 struct ether_header *eh; 
365 struct llinfo_arp *la = 0; 
366 struct rtentry *rt; 
367 struct in_ifaddr *ia, *maybe_ia = 0; 
368 struct sockaddr dl *sdl; 
369 struct sockaddr sa; 
370 struct in addr isaddr, itaddr, myaddr; 
371 int op; 
372 ea = mtod(m, struct ether arp *); 
373 op - ntohs(ea-»arp op); 
374 bcopy((caddr t) ea->arp spa, (caddr t) & isaddr, sizeof(isaddr)); 
375 bcopy((caddr t) ea->arp tpa, (caddr t) & itaddr, sizeof(itaddr)); 
376 for (ia = in ifaddr; ia; ia = ia-»ia next) 
377 if (ia->ia_ifp == &ac-»ac if) { 
378 maybe ia - ia; 
379 if ((itaddr.s_addr == ia->ia addr.sin addr.s addr) || 
380 (isaddr.s addr -- ia-»ia addr.sin addr.s addr)) 
381 break; i 
382 } 
383 if (maybe_ia == 0) 
384 goto out; 
385 myaddr = ia ? ia->ia addr.sin addr : maybe_ia->ia_addr.sin_addr; 
if_ether.c 
0 21-17 in arpinput [00000000 
21-18 in_arpinput 
386 if (!bemp((caddr_t) ea->arp_sha, (caddr_t) ac->ac_enaddr, if_ether.c 
387 sizeof (ea->arp_sha))) 
388 goto out; /* it's from me, ignore it. */ 
389 if (!bcmp((caddr t) ea->arp sha, (caddr t) etherbroadcastaddr, 
390 Sizeof(ea-»arp sha))) I ` 
391 log (LOG ERR, 
392 "arp: ether address is broadcast for IP address %x!\n", 
393 ntohl (isaddr.s_addr)); 
394 goto out; 
395 } 
396 if (isaddr.s_addr == myaddr.s addr) ( 
397 log (LOG ERR, 
398 "duplicate IP address %x!! sent from ethernet address: %s\n", 
399 ntohl (isaddr.s_addr), ether_sprintf (ea->arp_sha)); 
400 itadár = myaddr; 
401 goto reply; 
402 } 


eset ether.c 
U 21-18 in arpinput 0 0 000 D 0.0 0 D 0 








554 
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TCP/IP 2 
2. 
386-388 
389-395 
3; IP 
396-402 IP myaddr IP 
s IP 
myaddr reply([] 21-19) ARP 
== IP 
21-19 in_arpinput 
if_ether.c 
403 la = arplookup(isaddr.s addr, itaddr.s_addr == myaddr.s_addr, 0); 
404 if (la && (rt = la->la_rt) && (sdl = SDL(rt->rt_gateway))) { 
405 if (sdl->sdl_alen && 
406 bemp((caddr_t) ea->arp_sha, LLADDR(sdl), sdl->sdl alen)) 
407 log (LOG_INFO, "arp info overwritten for %x by %s\n", 
408 isaddr.s_addr, ether_sprintf (ea->arp_sha)); 
409 bcopy ((caddr_t) ea->arp_sha, LLADDR(sdl), 
410 sdl->sdl_alen = sizeof (ea->arp_sha)); 
411 if (rt->rt_expire) 
412 rt->rt expire = time.tv sec + arpt keep; 
413 rt->rt_flags &= ”RTF REJECT; 
414 la->la_asked = 0; 
415 if (la->la_hold) ( 
416 (*ac->ac if.if output) (&ac->ac if, la->la hold, 
417 rt_key(rt), rt); 
418 la->la_hold = 0; 
419 } 
420 } 
421 reply: 
422 if (op != ARPOP_REQUEST) { 
423 out: 
424 m freem(m); 
425 return; 
426 ) : 
if ether.c 
D 21-19 in arpinput [000000 ARP [I U LI UDO ARPO l 
4. IP 
403 arplookupl] ARP IP (isaddr) ARP 
IP IP ARP 1 
ARP 0 ARP 
ARP 
ARP 
ARP 
0 ARPO [D ( ) llinfo_ 


































































































































































































21 








ARP 





















































555 


















































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































arp 

5. 
404 if 

1) ARP ARP (O la ) 

2) ARP (rt) 

3) re gateway sockaddr_dl 

ARP IP 

6. 

405-408 (sdl_alen)[] 0 
ARP 
ARP 
IP 

7. 

409-410 rt_gateway sockaddr_dl 
sockaddr_dl (sdl_alen) 6 
ARP ( 21-3) 

8. ARP 

411-412 
20 (arpt keep)[] arp ARP 
ARP 0 21-24 ARP ( ARP ) 
0 
413-414 RTF REJECT la asked 0 
arpresolve ARP 
415-420 ARP ARP mbuf mbuf 
( 21-1 mbu ARP 
ether_outout arpresolve 
mbuf 

9. ARP 
421-426 ARP 

in_arpinput 21-20 ARP 

ARP 
1) 
2) ARP 
ARP ARP 
10. 


























































































































556 TCP/IP 2 China-bubıcom 
—— EE 





















































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































427—432 IP myaddr 
( Jl] arpcom 
ARP else 
- - if ether.c 
427 if (itaddr.s addr == myaddr.s addr) { 
428 /* I am the target */ 
429 bcopy ((caddr_t) ea->arp sha, (caddr t) ea->arp tha, 
430 sizeof (ea->arp_sha)); 
431 bcopy((caddr t) ac->ac_enaddr, (caddr t) ea->arp_sha, 
432 sizeof (ea->arp_sha)); 
433 } else { 
434 la = arplookup(itaddr.s addr, 0, SIN PROXY); 
435 if (la == NULL) 
436 goto out; 
437 rt = la->la_rt; 
438 bcopy ((caddr_t) ea->arp_sha, (caddr t) ea->arp_tha, 
439 sizeof (ea->arp sha)): 
440 sdl = SDL(rt->rt gateway); 
441 bcopy (LLADDR (sdl), (caddr t) ea->arp sha, sizeof(ea-»arp sha)); 
442 } 
443 bcopy ((caddr t) ea->arp_spa, (caddr t) ea->arp tpa, sizeof(ea->arp_spa)); 
444 bcopy((caddr t) & itaddr, (caddr t) ea->arp_spa, sizeof(ea->arp_spa)); 
445 ea->arp_op = htons (ARPOP_REPLY); 
446 ea->arp_pro = htons(ETHERTYPE IP); /* let's be sure! */ 
447 eh = (struct ether_header *) sa.sa_data; 
448 bcopy((caddr t) ea->arp_tha, (caddr t) eh->ether dhost, 
449 sizeof (eh->ether_dhost) ); 
450 eh->ether_type = ETHERTYPE_ARP; 
451 sa.sa_family = AF_UNSPEC; 
452 sa.sa len = sizeof (sa); . 
453 (*ac-»ac if.if output) (&ac-»ac if, m, &sa, (struct rtentry +) 0); 
454 return; : 
455 } å 
if ether.c 
0 21-20 in_arpinput] 0 000 ARP 0 0 0 ü D l 
11. ARP 
433-437 ARP 
arplookup 0 SIN_PROXY 
SIN_PROXY 1 ( 
ARP J] out mbu 
12. 
437-442 ARP ARP 
ARP 
IP ARP 
ARP| arp pub 
IPQ O ( )0 [] ARP 
13. ARP 
443-444 ARP 
IP IP itaddr 
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IP ( 21-18) 
445-446 ARP ARPOP_REPLY ETHERTYPE_IP 


u ” 








































































































































































































































































































ETHERTYPE_IPTRAILERS|| arpintr 

(trailer encapsulation) 
14. sockaddr 

447-452 sockaddr 14 21-12 











































































































































































































































































































453-455 ARP 


21.9 ARPI 1000 








































































































































































































































































































































































































































































































































































































































































































































































































































































































ARP — HI 
| | 21-1 21-10 #define 
rmx_expire ARP 
21.9.1 arptimer 
21-21 5 ARP 
if ether.c 
74 static void 
75 arptimer(ignored_arg) 
76 void *ignored_arg; 
771 
78 int s = splnet(); 
79 struct llinfo arp “la = llinfo arp.la next; 
80 timeout(arptimer, (caddr t) 0, arpt prune * hz); 
81 while (la !- &llinfo arp) ( 
82 struct rtentry *rt = la-»1a rt; 
83 la = la->la next; 
84 if (rt-»rt expire && rt-»rt expire «- time.tv sec) 
85 arptfree(la->la prev); /* timer has expired, clear */ 
86 ) 
87 splx(s); 
88 : 
e Z 
U 21-21 axptimer 000050040000 ARED O l! 
1. 
80 arp_rtrequest arptimer arptimer 5 
(arpt_prune) 




































































2. ARP 
81-86 ARP ( ) 
































































































































































































































arptfree rt_expire 





































































































21.9.2 arptfree[] |] 




































































21-22 arptfree arptimer llinfo_dl 
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ARP 
1. ( ) 
467-473 | 0 rt gatewary 
sockaddr_dl arptfree|| 
1) 
2) [] la asked 0 
3) RTF_REJECT 
sdl_alen 0 ARP 
s - if ether.c 
459 static void 
460 arptfree(la) 
461 struct llinfo arp “la; 
462 ( 
463 struct rtentry *rt = la->la_rt; 
464 struct sockaddr dl *sdl; 
465 if (rt == 0) 
466 panic("arptfree"); 
467 if (rt-»rt refcnt > 0 && (sdl = SDL(rt-»rt gateway)) && 
468 sdl->sdl family == AF LINK) { 
469 sdl->sdl alen = 0; 
470 la->la asked = 0; 
471 rt->rt flags &= "RTF REJECT; 
472 return; 
473 } 
474 rtrequest (RTM_DELETE, rt_key(rt), (struct sockaddr *) 0, rt_mask(rt), 
475 ` 0, (struct rtentry **) 0); 
476 } " 
if ether.c 
U 21-22 axpt£ree [JD [I 000000 ARP 0 0 0 
2. 
474-475 rtrequest 21.13 | | arp_ 
rtrequestl] arp rtrequest ARP mbuf([] la hold 
) llinfo arp 
21.10 arpresolve[|[]| 
4-16 ether output arpresolve IP 
arpreslove 1 IP 
arpresolve OL] arpsolve 
llinfo_arp la_hold “ (held)” IP ARP 
ARD IP 
arpresolve ARP ARP 
ARP IP 
IP ether_output 










































































































































































11.9 ARP 






































































































































21-23 










































































arpresolve 








Chinaspubecom um 559 














































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































252-261 dst Sockaddr in IP 
( 6 ) 
- if ether.c 
252 int 
253 arpresolve(ac, rt, m, dst, desten) 
254 struct arpcom *ac; 
255 struct rtentry *rt; 
256 struct mbuf *m; 
257 struct sockaddr *dst; 
258 u char *desten; 
259 ( 
260 struct llinfo arp “la; 
261 struct sockaddr dl *sdl; 
262 if (m-»m flags & M BCAST) ( /* broadcast */ 
263 bcopy((caddr t) etherbroadcastaddr, (caddr t) desten, 
264 sizeof (etherbroadcastaddr) ); 
265 return (1); 
266 } 
267 if (m->m_flags & M_MCAST) { /* multicast */ 
268 ETHER MAP IP MULTICAST(&SIN(dst)->sin addr, desten); 
269 return (1); 
270 ) 
271 if (rt) 
272 la = (struct llinfo arp *) rt-»rt llinfo; 
273 else ( 
274 if (la = arplookup(SIN(dst)->sin addr.s addr, 1, 0)) 
275 rt = la-»1a rt; 
276 } 
277 if (la == || rt == 0) L 
278 log (LOG DEBUG, "arpresolve: can't allocate llinfo"); 
279 m freem(m); 
280 return (0); 
281 } S 
ee if etheric 
0 21-23 arpresolve TOU 000000 ARPOO 
1. 
262-270 mbuf[] M BCAST 
1 M MCAST ETHER MAP IP MULTICAST([] 12-6)]] D 
2. llinfo_arp 
271-276 la 
llinfo_arp arplookup IP 
1 arplookup ARP 0 
ARP 
277-281 rt|| la 
arplookup rt| la 
0 
21-24 arpresolve ARP 
ARP 
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TCP/IP 2 
if_ether.c 
282 sdl = SDL(rt->rt_gateway); 
283 /* 
284 * Check the address family and length is valid, the address 
285 * is resolved; otherwise, try to resolve. 
286 */ 
287 if ((rt-»rt expire -- 0 || rt-»rt expire » time.tv sec) && 
288 sdl->sdl family == AF LINK && sdl->sdl alen != 0) ( 
289 bcopy (LLADDR(sdl), desten, sdl-»sdl alen); 
290 return 1; 
291 } 
292 /* 
293 * There is an arptab entry, but no ethernet address 
294 * response yet. Replace the held mbuf with this 
295 * latest one. 
296 */ 
297 if (la->la hold) 
298 m freem(la->la hold); 
299 la->la hold = m; 
300 if (rt-»rt expire) ( 
301 rt->rt flags &= ~RTF_REJECT; 
302 if (la->la asked == || rt-»rt expire !- time.tv sec) { 
303 rt-»rt expire - time.tv sec; 
304 if (la->la_asked++ « arp maxtries) 
305 arpwhohas (ac, &(SIN(dst)-»sin addr)); 
306 else { 
307 rt-»rt flags |- RTF REJECT; 
308 rt-»rt expire += arpt down; 
309 la->la asked = 0; 
310 } 
311 } 
312 J 
313 return (0); 
314 ) . 
IT. d ether.c 
U 21-24 arpresolve 00000 ARPD 0 0 0 0 D D 0 0 0 0 D 0 D D 0 ARP l 
3. ARP 
282-291 ARP ARP 
1) ( 0) 
2) [| rt gateway sdl family AF LINK 
3) (sdl alen) 0 
arptfree ARP sdl alen 0 
sockaddr_dl desten 1 
4, IP 
292-299 ARP 
ARP la hold mbuf la hold 
ARP ARP IP 
IP la hold NFS 
NFS 8500 IP 6 
ARP ARP ip_output ether_output 5 










































































































































































21 


561 








ARP 









































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































ARP NFS 6 
5. ARP ARP 
300-314 RFC 1122 ARP ARP 
ARP Net/3 ARP 
° Net/3 ARP 
. SM ARP ( 5 ) RTF REJECT 
1 20 ether output[] 20 
IP EHOSTDOWN[] EHOSTUNREACH(|] 4-15 ) 
s 20 arpresolve | | ARP 
0( ) RTF_REJECT 
ARP la_asked ARP 
0 ( ) 
ARP ARP 
( time_tv_usec ) 
la_asked 5(arp maxtries) 1 5 
arpwhohas ARP 5 ARP RTF_REJECT 1 
20 la_asked 0 
21-25 arpresolve[] ether output ARP 
Oooo 1-2 3 4 5 6 7 8 9 10 11 12 13 14 49 50 51 52 
RERERERERERE ERE 
= d | d d En P 16 D a ss 36 
ARP ARP ARP ARP ARP CN NN ARP 
oo 00 00 nn H eRe OECT EHOSTDOWN 00 
U U 
02135 OO ARED H 0 0000 0 
261] 0 10[] 36 0.5 IP 
1-52 
ARP ARP 
. Il] la asked O[] la hold 1[] rt. expire 
(GO) la asked 1 ARP 0 
. 2 | 1[] la hold 20 | rt_expire 
don [] ARP 0 
. 3 2] la hold 3 (11) 
rt expire(10) rt_expire Ill] la asked 1 5 
ARP la asked 2 
° 4 30 la hold 4 rt expire 



























































































































































5 62 TCP/IP 





























China-pubecom 















































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































2 
(11) 0 
. 5-10 9 ARP la asked 
5 
. 11 | 10] la hold | 11 (15) 
rt_expire(14) rt_expire 15 la_asked 5 
ARP RTF REJECT 1[] rt expire 
35( 201] jl 1a. asked 0 0 
° | [] 12 ether_output RTF_REJECT 1 | 
rt_expire(35) EHOSTDOWN ( ip_output) 
° 13[] 50 EHOSTDOWN 
. 51 RTF REJECT 1 (35) 
rt expire(35) arpresolve 
5 50 ARP 20 
ARP 
21.11 arplookupl |] 
arplookup rtallocl|] Internet ARP 
3 arplookup 
1) [] in_arpinput ARP IP ARP 
2) | in arpinput ARP ARP 
3) [| arpresolve IP ARP 
arplookup llinfo_arp 
arplookup IPU 
| 
ARP 
ARP Internet sockaddr_ 
inarp 21-26 ARP 
111 struct sockaddr inarp { eten 
112 u char sin len; /* sizeof(struct sockaddr inarp) = 16 */ 
113 u_char sin_family; /* AF INET */ 
114 u short sin port; : 
115 struct in_addr sin_addr; /* IP address */ 
116 struct in_addr sin_srcaddr; /* not used */ 
117 u_short sin_tos; /* not used */ i 
118 u short sin other; /* 0 or SIN PROXY */ 
on if etherh 
0 21-26 sockaddr inarp [00 
111-119 8 Sockaddr in sin family AF INET 8 
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sin srcaddrl|| sin tos[| sin other 
sin other SIN PROXY(l) 
21-27 arplookup | 
: — if ether.c 
480 static struct llinfo arp * 
481 arplookup(addr, create, proxy) 
482 u long addr; 
483 int create, proxy; 
484 ( 
485 struct rtentry *rt; 
486 static struct sockaddr inarp sin - 
487 (sizeof (sin), AF INET); 
488 sin.sin_addr.s_addr = addr; 
489 sin.sin_other = proxy ? SIN_PROXY : 0; š 
490 rt = rtallocl((struct sockaddr *) &sin, create); 
491 if (rt == 0) 
492 return (0); 
493 rt->rt_refcnt--; 
494 if ((rt->rt_flags & RTF GATEWAY) || (rt->rt flags & RTF_LLINFO) == 0 || 
495 rt->rt gateway->sa family != AF LINK) í 
496 if (create) 
497 log (LOG DEBUG, "arptnew failed on %x\n", ntohl(addr)); 
498 return (0); 
499 } 
500 return ((struct llinfo_arp zi rt-»rt llinfo); 
501 } : 
if ether.c 
U 21-27 arplookup 00.0 0 0 0 UU l 0 ARPU 0 
1. sockaddr_inarp 
480-489 sin_addr IP proxy 0 
sin_other SIN_PROXY 0 
2. 
490-492 rtallocl[] Internet IP create 0 
UL ) 
3. 
493 ARD 
= på rt_refent ARP 
494-499 RTF_GATEWAY RTF_LLINFO 
rt_gateway AF_LINK 
arptnew Net/2 ARP 
rtallocl RTF_CLONING 
arp rtrequest (21.13[] ) rtrequest 
































21.12 [][] ARP 


























Net/3 | ARP | ARP arp pub 


















































































































































564 



















































































































































































China-pubecom 

























































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































TCP/IP 2 
ARP arp_rtrequest ( 
21-28 ) RTF_ANNOUNCE 1 
ARP | IP ARP 
Oxf f f f £ f f £ 
SIN_PROXY 1 21-27 rtallocl 
21-20 arplookup 
SIN_PROXY 
|] HI ARP ARP | 
HI | ARP ARP ( 
HI ) arp -d “ published” 
ARP 
( ) 
sockaddr_inarg [| (J 21-26)[] sin other SIN PROXY 
12 Internet ([] 18-39) 8 
SIX PROXY arplookup rtallocl sin other 
SIN PROXY SIN PROXY 
ARP ARP 
ARP HD 
1) HS HD ARP HS HD 
2) 
3) HS HD 
4) HD HD HD 
netb ARP 14.6 arp - 
a * published (proxy only)” 
21.13 arp rtrequest[]|[]| 
21-3 ARP ARP 
1) arplookup rtallocl ARP 
ARP 
RTF CLONING 
( ) RTF CLONING 
rtallocl[] RTM RESOLVE rtrequest 18-2 
140.252.13.33[] 140.252.13.34 140.252.13.32 
2) arptfree[] RTM DELETE rtrequest ARP 
arp ARP arp 
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RTM RESOLVE|| RTM DELETE||RT GET 
rtrequest rtallocl 
IP rtinit 
rtreguest RTM ADD RTF_UP| | RTE CLONING 18- 
2[] 140 252 13 32 
19 ifaddr (ifa_rtrequest ) 
6-17 
in_ifinit arp_rtrequest ARP 
arp_rtrequest arp_rtrequest 
ARP 
arp_rtrequest llinfo_arp 
RTM_DELETE arp_rtrequest llinfo_arp 
21-28 arp_rtrequest 
- if ether.c 
92 void 
93 arp_rtrequest (req, rt, sa) 
94 int reg; 
95 struct rtentry *rt; 
96 struct sockaddr *sa; 
97 1 
98 struct sockaddr *gate = rt->rt gateway; 
99 struct llinfo arp “la = (struct llinfo arp zi rt->rt_llinfo; 
100 static struct sockaddr dl null sdl = 
101 (sizeof(null sd1), AF LINK); 
102 if (!arpinit done) { 
103 arpinit done - 1; i 
104 timeout (arptimer, (caddr t) 0, hz); 
105 } 
106 if (rt->rt flags & RTF GATEWAY) 
107 ` return; 
108 switch (reg) { 
109 case RTM_ADD: 
110 dÉ 
111 * XXX: If this is a manually added route to interface 
112 * such as older version of routed or gated might provide, 
113 * restore cloning bit. 
114 */ 
115 if ((rt-»rt flags & RTF HOST) == 0 && 
116 STN (YE mask(rt))->sin addr.s addr != Oxffffffff) 
117 rt->rt flags |= RTF CLONING; 
118 if (rt-»rt flags & RTF CLONING) { 
119 /* h 
120 * Case 1: This route should come from a route to iface. 
121 */ 
122 rt_setgate(rt, rt_key(rt), 
123 (struct sockaddr *) &null sdl); 
124 gate = rt->rt gateway; 
125 SDL(gate)->sdl type = rt->rt ifp->if type; 
126 SDL(gate)->sdl index =. rt-»rt ifp->if index; 
127 rt-»rt expire = time.tv sec; 


O 21-28 arp rtrequest [| [| 0 RM ADD [] [] 
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MÀ 

















































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































128 break; 
129 } 
130 /* Announce a new entry if requested. */ 
131 if (rt->rt flags & RTF_ANNOUNCE) 
132 arprequest ( (struct arpcom *) rt->rt_ifp, 
133 &SIN(rt_key (rt) )->sin_addr.s_addr, 
134 &SIN (YC Kev (rt) )->sin_addr.s_addr, 
135 (u_char *) LLADDR(SDL(gate))); 
136 /* FALLTHROUGH */ . 
if_ether.c 
U 21-28 (U) 
1. ARP timeoult 
92-105 arp_rtrequest ( 
) timeout arptimer ARP 
arptimer timeout 
2. 
106-107 RTF GATEWAY RTF GATEWAY 
ARP 
108 switch RTM ADD[] RTM RESOLVE[] RTM DELETE( 
) 
3. RTM ADD 
109 RTM ADD arp ARP rtinit 
IP (O 21-3) 
4. 
110-117 RTF_HOST ( 
) 1 
RTF CLONING 
/etc/netstart 









































route add -net 224.0.0.0 -interface bsdi 











































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































18-2 RTF CLONING | 
5. 
118-126 RTF_CLONING(in_ifinit ) 
rtinit rt setgate[| sockaddr_dl 
rt gateway 21-1[] 140.252.13.32 
sdl family[|sdl len null sd 
sdl type( IFT ETHER)[]sdl index ifnet 
sdl alen 0 
127-128 break 
rmx expire 21-1 
llinfo arp arptimer 
sockaddr dl rt gateway 
RTM RESOLVE rtrequest 
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netstat sdl_index link#n 18-2 
6. ARP 
130-135 RTF_ANNOUNCE arp pub 
(1) sockaddr_inarp sin_other SIN_PROXY 
(2) RTF_ANNOUNCE RTF_ANNOUNCE arprequest 
ARP ARP IP 
IP 
136 RTM_RESOLVE case 
21-29 arp_rtrequest RTM_RESOLVE 
rtallocl RTF_CLONING rtallocl 
(arplookup[] create ) 0 llinfo arp 
if. ether.c 
137 case RTM RESOLVE: 
138 if (gate->sa family !- AF LINK |l 
139 gate->sa len < sizeof(null sdl)) { 
140 log(LOG DEBUG, "arp rtrequest: bad gateway value"); 
141 break; 
142 H 
143 SDL (gate) ->sdl_type = rt->rt_ifp->if_type; 
144 SDL (gate) ->sdl_index = rt->rt_ifp->if_index; 
145 if (la != 0) 
146 break; /* This happens on a route change */ 
147 JE i 
148 * Case 2: This route may come from cloning, or a manual route 
149 * add with a LL address. 
150 */ : 
151 R_Malloc (la, struct llinfo_arp *, sizeof(*la)); 
152 rt->rt_llinfo = (caddr_t) la; 
153 if (la == 0) ( i 
154 log (LOG DEBUG, "arp_rtrequest: malloc failed\n"); 
155 break; 
156 } 
157 arp_inuse++, arp_allocated++; 
158 Bzero (la, sizeof(*la)); 
159 la->la_rt = rt; 
160 rt->rt_flags |= RTF_LLINFO; 
161 insque (la, &llinfo arp); 
162 if (SIN(rt key(rt))->sin addr.s addr == 
163 (IA SIN(rt->rt ifa))->sin addr.s addr) { 
164 /* 
165 * This test used to be 
166 * if (loif.if flags & IFF UP) 
167 * Tt allowed local traffic to be forced 
168 * through the hardware by configuring the loopback down. 
169 * However, it causes problems during network configuration 
170 * for boards that can't receive packets they send. 
171 * It is now necessary to clear "useloopback" and remove 
172 * the route to force traffic out to the hardware. 
173 *y 
174 rt->rt_expire = 0; 











[] 21-29 arp rtrequest JO [| RIM RESOLVE DD 
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EEN 











































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































175 Bcopy (( (struct arpcom *) rt->rt ifp)->ac enaddr, 
176 LLADDR (SDL (gate)), SDL(gate)->sdl_alen = 6); 
177 if (useloopback) 
178 rt->rt ifp = &loif; 
179 } 
180 break; if_ether.c 
U 21-29 (0) 
7. sockaddr_dl 
137-144 rt_gateway O U sockaddr dl sa familyl| sa_len|| || 
( | IFT_ETHER) | sockaddr_dl | 
8. 
145-146 llinfo_arp 
la arp_rtrequest llinfo_arp 
break 
9. llinfo_arp 
147-158 llinfo_arp rt Llinfo 
arp inuse[|arp allocated I] 11linfo arp 0 la hold 
la asked 0 
159-161 rt llinfo arp RTF LLINFO 18-2 
ARP 140.252.13.33[] 140.252.13.34[] 140.252.13.35 L 240.0.0.1 
arp (U 19-36) insque[] llinfo arp 
ARP rtrequest ( 
JU arp rtrequest llinfo arp 0 ARP 
arpresolve 
arplookup arp rtreguest ( 21-3) 
arpresolve ARP 
10. 
162-173 4.4BSD ( ODD ) 21-1 
IP (140.252.13.35)[] if IP 
11. 
174-176 0 — arpcom 
rt_gateway sockaddr_d1 
12. 
177-178 usrloopback 0( 1) 
g 4.4BSD[] 
/etc/netstart 
route add 140.252.13.35 127.0.0.1 
IP 4.4BSD 
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IP 
ARP 
IP RTM_RESOLLVE 
arp_rtrequest 21-30 RTM_DELETE|] 21-3 
arp ARP 
arptfree 
if_ether.c 
181 case RTM_DELETE: 
182 if (la == 0) 
183 break; 
184 arp_inuse--; 
185 remque (la); 
186 rt->rt_llinfo = 0; 
187 rt->rt_flags &= "RTF LLINFO; 
188 if (la->la hold) 
189 m freem(la->la hold); 
190 Free((caddr t) 1a); 
191 } 
192 ) 2 
if ether.c 
[] 21-30 arp rtrequest][][] RIM DELETE [] [] 
13. la 
182-183 1a llinfo arp 
break 
14. llinfo arp 
184-190 arp inuse[]l[] remque llinfo arp 
rt llinfo 0 RTF LLINFO ARP mbuf( ARP 
JO O O mbu llinfo arp 
switch default RTM GET | | 
arp RTM GET route output rtrequest 
21-3 RTM GET rtallocl 0 
rtallocl rtrequest 
21.14 ARP[I [| Ü 
IP ip_output 
(U [] 12-40) ip output 
( 8-24) IP 
18-2 224.0.0.0 " flag" 
224 (le0) 
(O 225-239 ) 
224.0.11( ) 224.0.0.0 
IP_MULTICAST_IF 
18-2 224.0.0.0 
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TCP/IP 2 
leo 
arpresolve 
21-23 ETHER MAP IP MULTICAST 
23 (O 12-6) ARP 
ARP 
ARP 
21-5 RTF LLINFO ARP 
ARP ETHER MAP IP MULTICAST 
ARP ARP 
18-2 224.0.0.1[] rtrequest rt_metrics ( 
19-9) 21-28 rmx_expire RTM_ADD 
224.0.0.1 
arptimer 224.0.0.1[] ARP 
21.15 DD 
ARP IP 
Net/3 BSD ARP 
llinfo_arp 21-1 
ARP 
ARP 
in_arpinput IP ARP 
IP ARP 
ARP Net/3 BSD 
ARP 5 
20 ARP 
U U 
21.1 21-17 ac 
21.2 ping arp -a 
ARP 
21.3 21-19 sdl_alen 6 
21.4 Net/2 ARP arpresolve 
ARP Net/3 
21.5 Net/2 ARP ARP 3 
ARP Net/3 
Net/3 
21.6 Net/3 ARP 
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21.7 [] 21-1 0 Ú [| rmx_expirel] |] OOOOODO | 

21.8 000 ARPH 0 U U U U U B D 0 0 U U U U ARPO U U U 

219 00000 21-250 0000 CL sock] [] [] 500 ms 
LU U D D DDD D 0 D 0 D UDP OO (000 -p U U U 0 0 0 U 
i) 100000 280sT0o0m[|OOOOOOD I 100 UDPTI 0 O Å 

Oo O 21-25] I II pil 

21.10 ARP 0 ARP LU U U U U U U U U U 0 U 

0 U U U U U 0 00 0 U UD 0 0 

























































































254 10 


U 220 U U DU U 




































































UDP 








(PCB) 




















TCP[] | 
















































































Internet 














(Internet protocol control block) 





TCP 
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Internet PCB 


| Internet! 


(TCP control block) 
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in pcb 











22-1 











































































































e|| socket 





























accept 
DTYPE_SOCKET 
SOCK_STREAM 




















socket 









































































































































file 
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LU | 














socket 























RAM 





SOCK_DG 





TCP 
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pcb 
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Internet PCB( 

















inpcb ) 


















































inp_socket 


socket 




























































































( tcpcb 




































































inpcb 






































UDP inpcb 
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inp. ppcb 












































inpcb 








inp faddr 

















inp lport 











IP 
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inp next 





















































Internet PCB 
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TCP 
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IP 
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TCP 














UDP 


























IP 








PCB 







































































IP 



























































in_pcbdetach 






































PCB 











32 





























IP 








in_pcballoc 














PCB 
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HDD HDD 000 000 
' U ' | 
filet) filet) filet) filet) 











DTYPE SOCKET DTYPE SOCKET 


socket () socket {} socket {} socket {} 










SOCK_DGRAM SOCK_STREAM 


inpcb{} 


udb: 








inp_faddr inp_faddr 


inp_faddr inp faddr 





inp fport linp fport 
inp. laddr inp laddr 


inp lport inp lport 
inp. ppcb 





| S 








^ - » 
Internet) DD [1 [] tepcbt} 








0 22-1 Internet LL L0 0 0 0 D 00 0 0 0 0 0 0 D 0 


22.2 Ul Ul 


PCB C 22-2 































































































































































































netinet/in pcb.h in_pebJ O00 
netinet/in_pcb.c PCBO D 











022-2 00000000 





574 





TCP/IP 2 




































































China"pub.tom 






































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































22.2.1 | 
22-3 
zeroin addr | struct in_addr 32bit] 9 PO [] 
1223 0000000000 
22.2.2 
Internet PCB[] TCP PCB malloc M_PCB 
60 mbuf M BUF[] socket 
M SOCKET 
PCB 
vmstat -m netstat -m mbuf 
22.3 inpcb|| |] |] 
22-41 inpcb 84 
in_pcb.h 
42 struct inpcb { -P 
43 struct inpcb *inp_next, *inp prev; /* doubly linked list */ 
44 struct inpcb *inp_head; /* pointer back to chain of inpcb's for 
45 this protocol */ 
46 struct in_addr inp_faddr; /* foreign IP ađdress */ 
47 u_short inp_fport; /* foreign port# */ 
48 struct in_addr inp_laddr; /* local IP address */ 
49 u_short inp_lport; /* local port# */ 
50 struct socket *inp socket;  /* back pointer to socket */ 
51 caddr t inp ppcb; /* pointer to per-protocol PCB */ 
52 struct route inp route; /* placeholder for routing entry */ 
53 int inp flags; /* generic IP/datagram flags */ 
54 struct ip inp ip; /* header prototype; should have more */ 
55 struct mbuf *inp options; /* IP options */ 
56 struct ip moptions *inp moptions; /* IP multicast options */ 
57 ); . 
in pcb.h 
O 22-4 ine [] [] 
43-45 inp next[] inp prev) UDP[] TCP PCB 
PCB (inp. head) UDP PCB[] inp head 
udb([] 22-1) TCP PCB tcb 
46-49 inp. faddr|J inp fport|| inp laddr[| inp lport 
IP IP IP PCB 




































































































































































































































































TCP[] UDP Internet PCB IP 



































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































| [Partridge 1987] 
RDP 8 bit | 8 bit | | LU 
2|] RDP [Partridge[] Hinden 1990] 16 bit | Ü 0 
TCP[] tcpcb UDP PCB[] 
| 
50-51 inp socket [] PCB[] socket [] inp. ppcb[] U 
PCB 0 22-1 inp_ppcb|] TCP 
tcpcb UDP socket[] inpcb 0 
Internet PCB( ) PCB | 
socket ( IP| ) 
52 IP ipp route 
ICMP Internet PCB IP IP 
PCB inp_route PCB IP 
U U U l U U 
53 inp_flags L 22-5 
inp_flags [] [] 
INP HDRINCL U D D 0 DD PIDODDOND) 
INP_RECVOPTS U D D IPD D 0 D D D 0 0 (10000000) 
INP RECVRETOPTS | Q000 IPD D 0 0 D D 0 0 0 D OD UDpD D 0 D 0 0 ) 
INP_RECVDSTADDR NPD OD DO DD DO U D U U (00 UDP) 
INP_CONTROLOPTS INP_RECVOPTS| INP-RECVRETOPTS| INP_RECVDSTADDR 
D 22-5 inp flags [J 
54 PCB IP IO U TOS[] TTL[] TOS 
UL JO TTL TCP[] UDP TTL 64 
IP TOS[| IP_TTL]|] | inpcb-inp ip 
O U TCP[] UDP] [] [| IP III III IP 
55-56 IP_OPTIONS[] [J | | IP ip_pcbopts 
mbuf| inp options mbuf| 
TCP[] UDP ip output | IP IP[] IP 
IP inp_moptions IP 
22.4 in, pcballoc[] in pcbdetach[|[] 
TCP[] UDP IP Internet PCB Socket 
PRU ATTACH UDP 23-33 



























































































































































struct socket *so; 


int error; 


error 


22-6 


in pcballoc(so, &udb); 






































in pcballoc 
PCB | 








































































































576 TCP/IP 2 China-bubıtoM 
Pet a 













































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































in pcb. 
36 int mp b.c 
37 in pcballoc(so, head) 
38 struct socket *so; 
39 struct inpcb *head; 
40 ( 
41 struct inpcb *inp; 
42 MALLOC (inp, struct inpcb *, sizeof(*inp), M PCB, M WAITOK); 
43 if (inp == NULL) 
44 return (ENOBUFS); 
45 bzero((caddr_t) inp, sizeof(*inp)); 
46 inp->inp_head = head; 
47 inp->inp_socket = so; 
48 insque(inp, head); 
49 so->so_pcb = (caddr_t) inp; 
50 return (0); 
51 ) . 
in pcb.c 
[] 22-6 in pcballoc 000000 Internet PCB 
36-45 in, pcballoc MALLOC PCB 
Net/2 Internet PCB[] TCP PCB mbu 
80[] 108 Net/3 84[] 140 TCP 
mbu Net/3 mbu 
2-6 PCB 17[] mbuf| 
Net/3 mbu Internet PCB[] TCP PCB Net/3 mbu Unix 
PCB netstat mbu 
mbu Internet 
bzero|] PCB 0 PCB IP 0 
in pcb.c 
252 int SH 
253 in pcbdetach(inp) 
254 struct inpcb *inp; 
255 { 
256 struct socket *so = inp->inp socket; 
257 so->so_pcb = 0; 
258 sofree (so); 
259 if (inp->inp_options) 
260 (void) m_free (inp->inp_options); 
261 if (inp->inp_route.ro_rt) 
262 rtfree (inp->inp_route.ro_rt); 
263 ip_freemoptions (inp->inp_moptions); 
264 remque (inp); 
265 FREE (inp, M PCB); 
266 } . 
in pcb.c 
D 22-7 in pcbdetach 2000000090 Internet PCB 
2. 
46-49 in head PCB (udb[] tcp)l] inp. socket Socket 






















































































22 




















577 































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































PCB (insque)[] socket PCB[] insque 
PCB 
PRU DETACH[] | Internet PCB o 22-7 
in_pcbdetach | 
252-263 socket PCB OL] sofree PCB 
IP mbu m_free PCB rtfree 
ip_freemoptions 
264-265 remque PCB TU | PCB 
225 1010000000 
HUU | LU 
| 
1. IP 
22-8 bind IP 
— (well-known 
port) — 
(ephemeral port) 
bind IP 22-8 3 6 
* 
O D 1Pg O U U 0 U [ [] 
U D D 0 0 U U O0000000000 
OD U U O00000000000 
* U U O00000000000000 
U D D 0 0 0 O000000000000 
OD 0 O00000000000 
3 0 O000000000000 
022-8 bina JIIPOOOOOOOODOOO 
IP ( ) 
IP IP IP IP — 
— | U [] [] | | | IP 
g IP 
IP ([] 22-8 4 SU) 
IP (I 22-8 ) 
22-8 HEU O 
U U U U U U 
EADDRINUSE ( ) (in use) 
PCB “ u 
TCP[] UDP TCP UDP) 




















































































































578 TCP/IP 2 Chinapub.tom 
— a 



























































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































Net/3 
SO_REUSEADDR IP ( 
) | 
] IP 140.252.1.29 
140.252.1.29 5555 127.0.0.1 
5555 IP 5555 
bind setsockopt 
SO REUSEADDR 
SO REUSEPORT [] IP O O 0 mu 
SO_REUSEADDR 
140.252.1.29[] IP 
140.252.1.29 6666 SO_REUSEPORT 
140.252.1.29 6666 
140.252.1.29 
6666|] IP 
SO REUSEPORT[] Net/3 4.4BSD 
IP 
O O so REUSEPORTII |] | E LU u 
0 O OO Solaris 2.x SO_REUSEADDR 
IP 
2 UDP 
connect TCP UDP UDP 
connect IP 
UDP 
UDP IP bind 
connect IP 
22-9 UDP 
OOOO OOd0 U [ 
locallP.Iport | foreignIP.fport | UOODODOO 
socket (), bind (*.Iport), connect (foreignIP, fport) 
socket (), bind (localIP, lport), connect (foreignIP, fport) 
localIP.lport E 0800000000000 tocallP 
socket (), binfdocalIP lport) 
*.Iport MS UD D D 0 Serf 0000 
socket () , bind ( *, Iport) 
022-9 UbPD D HH D D.D D P000 0O00 0 0 






















































































UDP (connected UDP socket) UDP 














































































































(unconnected UDP socket) UDP 


























































































































































































































22 





































































































579 























































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































IP 
3. TCP IP 
22-10 sun Telnet LISTEN 
IP 140 252 111 1500 
140.252.129 ( 
IP ) 
U 0 D U O000 U D 0 U U DU 0 U TCP] [| 
140.252.1.29 23 * ba LISTEN 
* 23 * * LISTEN 
140.252.1.29 23 140.252.1.11 1500 ESTABLISHED 
0 22-10 00000230 D 0 TCPO D 
IP g API 
TCP 0 TCP accept U 
( TCP ) IP 
IP TCP 
API 
TCP 23 in_pcblookup 
Internet PCB 
(wildcard match) IP 
PCB i 0 
1( IP IP VT 2( IP ) 
140.252.1.11 1500 140.252.1.29 23 
22-11 22-10 
0000 U 0 0 U 0000 0000 TCP[] l] U U D D U 
140.252.1.29 23 * * LISTEN 1 
* 23 * * LISTEN 2 
140.252.1.29 23 140.252. 1.11 1500 ESTABLISHED 0 
0 22-11 [] (140.252.1.11, 150030) (140.252.1.29, 2318000000 
(OPODO) 
( IPD DO) 
Net/3 
140.252.1.11 1501 140.252.1.29 
23 22-12 
U 0 D U (DUU U 0 D U 0000 TCP) U U 0 D 0 U 
140.252.1.29 23 * * LISTEN 1 
* 23 * * LISTEN 2 
140.252.1.29 23 140.252.1.11 1500 ESTABLISHED 
0 22-12 [] (140.252.1.11, 1501) (140.252.1.29,230 00000 












































































































































580 



































China-pubecom 

































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































TCP/IP 2 
( PCB IP 
YOU 
TCP o 22-11 
22-12 (0 0 SYN) 
in_pcblookup TCP 
O TCP IP 
O PCB 
4. UDP IP 
UDP TCP UDP 
Net/3( ) 
IP Net/3 
1) IP IP UDP 
“ ” ( ) 
2) IP UDP 
22-13 UDP UDP 
SO REUSEADDR[] SO_REUSEPORT ODO! 
IP 
140.252.1.29 577 140.252.1.11 1500 000000 mau 
140.252.13.63 577 140.252.13.35 1500 000000 P< 
140.252.13.63 577 * * O00000P=00 
* 577 * z D00000 P=o0000 
[] 22-13 1000000570 UDP DU 
140.252.13.63( 140.252.13 ) ST 
140.252.13.34 1500 22-14 
0000 0000 U 0 D U D 0 [ DU 
140.252.1.29 577 140.252.1.11 1500 0000000 1000 
140.252.13.63 577 140.252.13.35 1500 00001000 
140.252.13.63 577 * * nu 
* 577 * * OD 
D 22-14 000 (140.252.13.34, 150030) (140.252.13.63, 5770 0 00 
IP IP IP 
IP IP IP 
140.252.129( ) 577 140 252 1.111 




















































































































































































































1500 











22-15 


































































































22 


















































1 


140.252.13.63 


140.252.13.63 


* 





0000 


40.252.1.29 


[25-15 











"n 


O0 





* 


* 





140.252.1.11 
140.252.13.35 


D DD U 





D B ü or 


00000 
0000 IP 





00200 


O (140.252.1.11, 150030) (140.252.1.29, 57730 Ü 


U 


U 








581 











































































































































































































































































































22.6 in pcblookupl[] |] 







































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































in_pcblookup 
1) [| TCP[] UDP IP in_pcblookup Internet PCB 
PCB 
2) bind IP 
in_pcbbind 
3) bind 
in_pcbbind 
4) connect in_pcbbind 
( UDP connect 
23 ) 
2 3 4 in_pcbbind in_pcblookup 
SO REUSEADDR[| SO REUSEPORT 
( UDP | IP 
PCB UDP ) | 
( IP ) 
IP "^ in pcblookup 
IP BSD[] 386 Craig Leres[] 4.4BSD 
1 in pcblookup [| 2 4 
in pcbconflict 3 in uniqueport 
Net/3 
in pcblookup 
22-16 in pcblookuup 
PCB PCB match 
matchwild 







































































































































































































































































582 























































































































































































































China-pub.com 





























































































































































































































[] 22-16 in pcblookup JO U JJ I] J JJ PO 000 


TCP/IP 2 
3 ( 2 ) wildcard 
PCB 
1. 
PCB lport PCB 
— in_pcb.c 
405 struct inpcb * 
406 in_pcblookup (head, faddr, fport_arg, laddr, lport_arg, flags) 
407 struct inpcb *head; 
408 struct in_addr faddr, laddr; 
409 u_int fport_arg, lport_arg; 
410 int flags; 
411 { 
412 struct inpcb *inp, “match = 0; 
413 int matchwild = 3, wildcard; 
414 u_short fport = fport arg, lport = lport_arg; 
415 for (inp = head->inp_next; inp != head; inp = inp->inp_next) { 
416 if (inp->inp_lport != lport) 
417 continue; /* ignore if local ports are unequal */ 
418 wildcard = 0; 
419 if (inp->inp_laddr.s_addr != INADDR_ANY) { 
420 if (laddr.s_addr == INADDR_ANY) 
421 wildcard++; 
422 else if (inp->inp_laddr.s_addr != laddr.s_addr) 
423 continue; 
424 } else { 
425 if (laddr.s addr != INADDR ANY) 
426 wildcard++; 
427 } 
428 if (inp->inp_faddr.s_addr != INADDR_ANY) { 
429 if (faddr.s_addr == INADDR_ANY) 
430 wildcard++; 
431 else if (inp->inp_faddr.s_addr != faddr.s_addr || 
432 inp->inp_fport != fport) 
433 continue; 
434 } else { 
435 if (faddr.s_addr != INADDR_ANY) 
436 wildcard++; 
437 } 
438 if (wildcard && (flags & INPLOOKUP_WILDCARD) == 0) 
439 continue; /* wildcard match not allowed */ 
440 if (wildcard < matchwild) { 
441 match = inp; 
442 matchwild = wildcard; 
443 if (matchwild == 0) 
444 break; /* exact match, all done */ 
445 } 
446 } 
447 return (match); 
448 3 å 
in pcb.c 











China-pubscom . 583 



































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































2. 
419|] 427 in pcblookup PCB laddr 
wildcard 1 | 
PCB wildcard 
22-17 
PCB[] [| IP | laddr[] [] 0 Ú] 
OG * * wildcard++ 
UU: OO * O0POOOOOOOOGOOOO PCB 
* E U DU D U 
* OG * wildcard++ 
[] 22-17 in pcblookup 000 PH] II D D 
3. 
428|| 437 
IP 
22-18 IP 
PCB[] [| IP | faddr[] [] [] [] 
OM * * wildcard++ 
ODO + UU: OO IPD 0 D D D 0 D 0 D 000000 PCB 
* * U DU D U 
* OM * wildcard++ 
O 22-18 in peblokp 000000 IPC] D U 0 
22-18 PCB 
0 connect 
IP 
22-10 22-13 
4. 
438|] 439 flags INPLOOKUP WILDCARD 
(wildcard ) 
PCB TCP[] UDP INPLOOKUP WILDCARD 
( 22-10 22-13 ) 
connect flags 0 
5. 
440—447 
(wildcard[] 0) PCB 
— TCP 
22-19 22-11 TCP in_pcblookup 
140.252.1.11 1500[] 140.252.1.29 23 PCB 














































































































































































































584 iu China"pubitom 
A ss 













































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































laddr IP lport TCP faddr IP fport TCP 
PCB[] 
wildcard 
O000 0000 unu U DU D U 
140.252.1.29 23 * * 1 
* 23 * * 2 
140.252.1.29 23 140.252.1.11 1500 0 
D 22-19 laddr =140.252.1.29]] lport= 23[] faddr = 140.252.1.11[] fport= 1500 
wildcardl] I( IP JO flags 
INPLOOKUP_WILDCARD match PCB[] matchwild 1 
wildcard[] 2( IP ) 
matchwild wildcard|[ 0 
matchwild(l) match 
PCB 
TCP[] UDP in pcblookup 
faddr[] laddr IP 
flags 
in pcblookup in pcbbind 
in pcbconnect 












































































































































22.7 in pcbbind[|[] 
































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































in pcbbind 
1) bind TCP ( ) 
2) bind UDP ( 
) 
3) connect TCP ([] TCP 
) 
4) listen TCP ( 
TCP [| listen[] TCP ) 
5) [| in pcbconnect(22.8[] ) IP ( 
UDP connect UDP sendto ) 
3 4 5 IP 
( ) 
1 2 (explicit bind) 30 40 5 (implicit bind) 
2 
(RPC) 
RPC ( 10 29.40 Sun 
) 


























China=pubecom B 585 

































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































in pcbbind 22-20 
in pcb.c 
52 int P 
53 in pcbbind(inp, nam) 
54 struct inpcb *inp; 
55 struct mbuf “nam; 
56 ( 
57 struct socket *so = inp->inp_socket; 
58 struct inpcb *head = inp->inp head; 
59 struct sockaddr_in *sin; 
60 struct proc *p = curproc; /* XXX */ 
61 u short lport = 0; 
62 int wild = 0, reuseport = (so->so_options & SO_REUSEPORT); 
63 int error; 
64 if (in_ifaddr == 0) : 
65 return (EADDRNOTAVAIL); - : 
66 if (inp->inp lport || inp->inp_laddr.s_addr != INADDR_ANY) 
67 return (EINVAL); 
68 if ((so->so_options & (SO_REUSEADDR | SO_REUSEPORT)) == 0 && 
69 ((so->so proto-»pr flags & PR CONNREQUIRED) == 0 || 
70 (so-»so options & SO ACCEPTCONN) == 0)) 
71 wild = INPLOOKUP WILDCARD; ji 
in_pcb.c 
0 22-20 in pebbind 000009000000 
64-67 | | | | | IP 
68-71 if SO_REUSEADDR|| SO_REUSEPORT 
wild INPLOOKUP_WILDCARD 
UDP PR CONNREQUIRED 
[Torek 1992] SO ACCEPTCONN 
listen (15.9[] ) TCP 
socket[| bind listen in_pcbbind{] bind 
| Socket listen bind[] TCP 
PRU LISTEN in pcbbind SO ACCEPTCONN 
if SO ACCEPTCONN 
af 
if ((so->so options & (SO REUSEADDR|SO REUSEPORT)) == 0 && 
((so-»so proto->pr flags € PR CONNREQUIRED)==0 | |1) 
wild = INPLOOKUP_WILDCARD; 
1 
if ((so-»so options & (SO REUSEADDR|SO REUSEPORT)) == 0 ) 
wild = INPLOOKUP WILDCARD; 
REUSE wild 0 
REUSE | wild INPLOOKUP WILDCARD 
in pcblookup REUSE 
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TCP/IP 2 
in_pcbbind 22-22 nam 
72-75 bind nam 
(connect[] listen[] in pcbconnect 30 4[] SU nam 
Sockaddr in mbuf 22-21 
nam 
nami [] PCBD D D DDD 
localIP Iport inp_laddr inp_iport O O 
OM * 0 localIP U H 00 localIP[] BB D] 0000 
OM * DD localIP Iport O00 in_pcblookup 
* 0 S (000 
* Ooo * Iport ODO in_pcblookup 
[] 22-21 in pcbbind [| nam[] 000000 
76-83 in pcbconnect([] 22-25) 
85-94  Net/3 IP SO REUSEADDR 
SO REUSEPORT 
95-99 ifa_ifwithaddr 
“ yech" 0 ifa 
ifwithaddr IP 
bind (sin zero[8]) 8 
ifa ifwithaddr in pcbbind 
100-105 (Y 22- 
21 2 4 ) if 
1024(IPPORT_RESERVED) Internet 
1024 (reserved port) 
rcmd [Stevens 1990] rlogin|| rsh 
106-109 in pcblookup([] 22-16) IP 
PCB | IP ( IP ) | 0 
( ) in_pcblookup PCB IP 
— IP sin->sin addr[] lport 
REUSE wild 
INPLOOKUP WILDCARD 
111 IP PCB 
IP IP 
IP IP 
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72 if (nam) { ini pbg 
73 sin = mtod(nam, struct sockaddr in *); 
74 if (nam->m_len !- sizeof(*sin)) 
75 return (EINVAL); 
76 #ifdef notdef 
77 /* 
78 * We should check the family, but old programs 
79 * incorrectly fail to initialize it. 
80 E 
81 if (sin->sin family !- AF INET) 
82 return (EAFNOSUPPORT): 
83 #endif 
84 lport = sin->sin port;  /* might be 0 */ 
85 if (IN_MULTICAST (ntohl (sin->sin_addr.s_addr))) { 
86 /* l 
87 * Treat SO_REUSEADDR as SO_REUSEPORT for multicast; 
88 * allow complete duplication of binding if 
89 * SO_REUSEPORT is set, or if SO_REUSEADDR is set 
90 * and a multicast address is bound on both 
91 * new and duplicated sockets. 
92 */ 
93 if (so->so options & SO_REUSEADDR) 
94 reuseport = SO_REUSEADDR | SO_REUSEPORT; 
95 } else if (sin->sin_addr.s_addr != INADDR ANY) { 
96 sin->sin_port = 0; /* yech... */ 
97 if (ifa ifwithaddr((struct sockaddr *) sin) == 0) 
98 return (EADDRNOTAVAIL); 
99 ) 
100 if (lport) { 
101 struct inpcb *t; 
102 /* GROSS */ 
103 if (ntohs(lport) < IPPORT RESERVED && 
104 (error = suser (p->p_ucred, &p->p acflag))) 
105 return (error); 
106 t = in_pcblookup (head, zeroin_addr, 0, 
107 sin->sin_addr, lport, wild); 
108 if (t && (reuseport & t->inp_sockét->so_options) == 0) 
109 return (EADDRINUSE); 
110 } 
111 inp->inp laddr = sin->sin_addr; /* might be wildcard */ 
112 } i ç 
in_pcb.c 
U 22-22 in pcbbind [] 0 D D D D D 0 nam D] O 
0 nam ( ) in pcbbind 
113-122 (TCP[] UDP) PCB head 
tcb[] udb head PCB inp next[] inp. back inpcb 
head PCB 
PCB 1024 
(IPPORT RESERVED) 1 5000(IPPORT USERRESERVED) 1024 
in pcbbind 
1. SO REUSEADDR| 
in pcbbind||in pcblookup REUSE 


































































































































































































588 TCP/IP 2 China=pubecom 
— HH 




















































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































113 if (lport == 0) in_pcb.c 
114 do ( 
115 if (head->inp_lport++ < IPPORT RESERVED || 
116 head->inp_lport > IPPORT USERRESERVED) 
117 head->inp lport = IPPORT RESERVED: 
118 lport = htons(head->inp. lport); 
119 ) while (in pcblookup (head, 
120 zeroin addr, 0, inp-»inp laddr, lport, wild)); 
121 inp->inp lport = lport; ] 
122 return (0); 
123 } 
in_pcb.c 
O 22-23 inpebbind 00000000000 
1) TCP[] UDP socket[] bind bind[] TCP 
IP 23(Telnet ) 
SO REUSEADDR 
in pcbbind[| INPLOOKUP WILDCARD in pcblookup 
in pcblookup PCB 
TCP in pcbbind 0 
2) 
in pcblookup {*, 23] [] PCB wildcard 
0 in pcblookup reuseport|] 0 
in pcbbind EADDRINUSE 
3) SO_REUSEADDR 
in_pcbbind in_pcblookup 
0 12,2330 PCB in pcblookup 
(U 22-17) wildcard|] QU) in pcbbind EADDRINUSE 
SO_REUSEADDR 
4) Telnet {*, 23} 
(140.252.13.35[] 23} 
SO_REUSEADDR in_pcblookup 
INPLOOKUP_WILDCARD * 23[] PCB wildcard 1 
TCP PCB 
in pcbbind EADDRINUSE 
5) {140.252.13.35, 23} 
SO_REUSEADDR 
in_pcblookup 0 
12,2330 PCBU [| wildcard 1 flags 0 
TCP PCB | 














































































































































































































in pcbbind 0 








22 
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6) [*,23] Telnet 
{140.252.13.35, 23] | 
[] [] U | 23 
in_pcblookup INPLOOKUP_WILDCARD 
SO_REUSEADDR {140.252.13.35, 23] [] PCB 
wildcard 1 TCP PCB 
in_pcbbind EADDRINUSE 
7) 0 IP 0 
{140.252.13.35, 23} Telnet 
(127.0.0.1, 23} | SO_REUSEADDR 
0 0 in pcbbind 0 in_pcblookup|] |] 0 
INPLOOKUP_WILDCARD {140.252.13.35, 23)[] PCB 
IP in_pcblookup in_pcbbind 0 
0000000000 so REUSEADDRI [I 000000 PO 0 0 
wildcard 0 PCB TP IP 
O O | in_pcblookup INPLOOKUP_WILDCARD] DD 
8) | | | U 
IP 127.0.0.1 
0 in pcblookup[] 0 PCB 0 
SO REUSEADDR wildcard 
0 in pcblookup in pcbbind EADDRINUSE 
IP SO REUSEADDR | 
22-24 localIP1[] local P2 IP 
localmcastIP PCB 
in_pcbbind 
[] SO. REUSEADDR[] SO_REUSEPORT 
SO REUSEADDR 
LocalIPl | localIP1 | qq Oo POOOOOOOOOO 
locallP1 | locallP2 | n [] ` 000000000090 
localIP1 i U U O000000000000000000 
å localIPl | QQ O000000000000000000 
* ji U U U D 0 D D DU D 00000000) 
locallP1 | locallP1 | Ú H DH H H H 
[ 22-24 so REUSEADR []D D D D D 0 D] 0 œn 0 0 0 D 
2. SO_REUSEPORT 
Net/3 SO REUSEPORT in pcbbind SO REUSEPORT 













































































































































































































































































22.8 in_pcbconnect|| |] 

















in_pcbconnect 











0 IP 
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TCP/IP 2 
1) connect TCP ( TCP ) 
2) connect UDP (L) UDP UDP ) 
3) UDP ( ) sendto 
4) ( SYN ) LISTEN ([] TCP ) 
TCP tcp input 
in pcbconnect IP 
in pcbconnect 
in_pcbconnect 22-25 
in pcb.c 
130 int + 
131 in_pcbconnect (inp, nam) 
132 struct inpcb *inp; 
133 struct mbuf “nam; 
134 ( 
135 struct in_ifaddr *ia; 
136 struct sockaddr_in *ifaddr; 
137 struct sockaddr in “sin = mtod(nam, struct sockaddr in +); 
138 if (nam->m_len !- sizeof(*sin)) 
139 return (EINVAL); 
140 if (sin->sin_family != AF_INET) 
141 return (EAFNOSUPPORT); 
142 if (sin->sin port == 0) 
143 return (EADDRNOTAVAIL); 
144 if (in ifaddr) { 
145 /* I 
146 * If the destination address is INADDR_ANY, 
147 * use the primary local address. 
148 * If the supplied address is. INADDR_BROADCAST, 
149 * and the primary interface supports broadcast, 
150 * choose the broadcast address for that interface. 
151 * 
152 #define satosin(sa) ((struct sockaddr in *) (sa)) 
153 #define sintosa(sin) ((struct sockaddr *) (sin)) 
154 #define ifatoia(ifa) ((struct in_ifaddr *) (ifa)) 
155 if (sin->sin_addr.s_addr == INADDR_ANY) 
156 sin->sin_addr = IA SIN(in ifaddr)->sin addr; 
157 else if (sin-»sin addr.s addr == (u long) INADDR BROADCAST && 
158 (in ifaddr->ia ifp->if flags & IFF BROADCAST)) 
159 sin->sin addr = satosin(&in ifaddr->ia broadaddr)->sin addr; 
160 ) " ç 
in_pcb.c 
U 22-25 in pcbeonneet 900000000000 POO 
1. 
130-143 nam sockaddr_in IP mbu 
0 
25 0.0.0.0[] 255.255.255.255 
134-160 in ifaddr IP 
0.0.0.0(INADDR ANY) IP IP 0.0.0.0 
IP 255.255.255.255 (INADDR_BROADCAST) 
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255.255.255.255 UDP 
IP — 
255.255.255.255 IP 
22-26 TCP[] UDP 
11 2[] 3 
: i z in_pcb.c 
161 if (inp->inp_laddr.s_addr == INADDR ANY) ( 
162 struct route *ro; 
163 ia = (struct in_ifaddr *) 0; 
164 /* 
165 * If route is known or can be allocated now, 
166 * our src addr is taken from the i/f, else punt. 
167 */ 
168 ro - &inp-»inp route; 
169 if (ro-»ro rt && 
170 (satosin(&ro-»ro dst)->sin addr.s addr != 
171 sin-»sin addr.s addr || 
172 inp-»inp.socket-»so options & SO DONTROUTE)) { 
173 RTFREE(ro-»ro rt); 
174 ro-»ro rt - (struct rtentry *) 0; 
175 ) 
176 if ((inp-»inp socket->so options & SO DONTROUTE) == 0 && /* XXX */ 
177 (ro-»ro rt == (struct rtentry *) 0 || 
178 ro-»ro rt-»rt ifp -- (struct ifnet *) 0)) ( 
179 /* No route yet, so try to acquire one */ 
180 ro->ro dst.sa family = AF INET; 
181 ro-»ro dst.sa len - sizeof(struct sockaddr in); 
182 ((struct sockaddr in *) &ro-»ro dst)->sin addr = 
183 sin-»sin, addr; 
184 rtalloc(ro); 
185 } 
186 /* 
187 * If we found a route, use the address 
188 * corresponding to the outgoing interface 
189 * unless it is the loopback (in case a route 
190 * to our address on another net goes to loopback). 
191 */ 
192 if (ro-»ro rt && !(ro->ro_rt->rt_ifp->if_flags & IFF LOOPBACK)) 
193 ia - ifatoia(ro-»ro rt-»rt ifa); 
194 if (ia == 0) ( 
195 u short fport = sin->sin port; 
196 sin->sin port = 0; 
197 ia = ifatoia(ifa ifwithdstaddr(sintosa(sin))); 
198 if (ia == 0) 
199 ia = ifatoia(ifa_ifwithnet (sintosa (sin))); 
200 sin->sin port = fport; i 
201 if (ia == 0) 
202 ia = in_ifaddr; 
203 if (ia == 0) 
204 return (EADDRNOTAVAIL); 
205 } 





in_pcb.c 
D 22-26 in pcbconmect DO D D D TOO IPOD 
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TCP/IP 2 
164-175 PCB 
SO_DONTROUTE 
PCB 3 
UDP in_pcbconnect sendto 
UDP in pcbconnect[| ip output[]| in pcbdisconnect 
IP in pcbconnect 
UDP sendt 
IP 
ip output 
SO DONTROUTE IP 
IP 
4. 
176-185 SO_DONTROUTE PCB 
rtalloc 
De 
186-205 ia (in  ifaddr[] 6.5] ) 
IP PCB rtalloc 
ifa withdstaddr 
ifa withnet IP 
0 fport 
IP (in ifaddr) (in ifaddr[] 0) 
22-27 in_pcbconnect 
206-223 ( 
IP MULTICAST IF ) IP IP 
224-225 22-26 ia 
sockaddr_in ifaddr 
in_pcblookup 22-28 
6. 
227-233 in_pcblookup 
in_pcbconnect ifaddr 
0 TCP 
TCP sun TCP 
(8888 -b ) in_pcblookup 
connect EADDRINUSE( 1 CH sock ) 
bsdi S sock -b 8888 sun echo & 00000000 
bsdi S sock -A -b 8888 sun echo [00000 





connect () error: 
























































Address already in use 
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in pcb.c 
206 /* 7 
207 * If the destination address is multicast and an outgoing 
208 * interface has been set as a multicast option, use the 
209 * address of that interface as our source address. 
210 */ 
211 if (IN_MULTICAST (ntohl (sin->sin_addr.s_addr)) && 
212 inp->inp_moptions != NULL) { 
213 struct ip_moptions *imo; 
214 struct ifnet *ifp; 
215 imo = inp->inp moptions; 
216 if (imo->imo multicast ifp != NULL) { 
217 ifp = imo->imo multicast ifp; 
218 : for (ia = in ifaddr; ia; ia = ia->ia next) 
219 if (ia->ia_ifp == ifp) 
220 break; 
221 if (ia == 0) 
222 return (EADDRNOTAVAIL); 
223 } 
224 } 
225 ifaddr = (struct sockaddr_in *) &ia->ia addr; 
226 } . 
in pcb.c 
U 22-27 in pcbconect [][I[U UU Lut 0 0 tL D 0 
i ë : I in_pcb.c 
227 if (in_pcblookup(inp->inp_head, 
228 sin->sin_addr, 
229 sin->sin_port, 
230 inp->inp_laddr.s_addr ? inp->inp laddr : ifaddr->sin addr, 
231 inp->inp_lport, 
232 0)) 
233 return (EADDRINUSE); 
234 if (inp->inp_laddr.s_addr == INADDR_ANY) { 
235 if (inp->inp_lport == 0) 
236 (void) in pcbbind(inp, (struct mbuf +) 0); 
237 inp->inp laddr = ifaddr->sin_addr; 
238 ) 
239 inp->inp faddr = sin->sin_addr; 
240 inp->inp_fport = sin->sin port; 
241 return (0); 
242 } . 
in pcb.c 
D 22-28 in pcbcomect 000000020000 
- A SO REUSEADDR bind connect 
(8888) 
bsdi sun 
22-28 in pcblookup 0 
UDP 
UDP 
connect UDP sendto 
7. 
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TCP/IP 2 
234-238 ifaddr 
22.7 30 40 5 
in_pcbbind | in pcbbind 
inp_laddr in_pcbbind 
8. PCB 
239-240 PCB IP 
PCB mg — 
IP 
IP IP 
TCP[] UDP[] PCB inp_laddr IP 
bind IP ULU in_pcbbind ifa_ifwithaddr 
) in pcbconnect 
( ) 
IP ip output 
IP 
Net/3 (8.4[] ) 
22.9 in pcbdisconnect||[| 
ip pcbdisconnect[] UDP IP O(INADDR ANY) 
0 
UDP UDP 
connect | sendto UDP 
in pcbconnect udp output 
in pcbdisconnect 
in pcbdisconnect in pcbdetach PCB 
PCB 
22-29 in pcbdisconnect 
243 int in, pcb.c 
244 in pcbdisconnect (inp) 
245 struct inpcb *inp; 
246 { 
247 inp->inp_faddr.s_addr = INADDR ANY; 
248 inp->inp_fport = 0; 
249 if (inp->inp_socket->so_state & SS_NOFDREF) 
250 in pcbdetach(inp); 
— in_pcb.c 
0 22-29 in pcbdisconneet [JD D [DL D U DD U U D D 0 
PCB (SS NOFDREF ) in pcbdetach([] 22-7) 


























































































































PCB 
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22.10 in setsockaddr[| in_setpeeraddr|]| |] 



























































getsockname ( Internet IP 



































































































































JU getpeername 
PRU SOCKADDR!|| PRU PEERADDR in setsockaddr 








































































































































































































in setpeeraddr 22-30 
























































































































































































































































































































































































































































































































































































































































































































































































































































in pcb.c 
267 int + 
268 in_setsockaddr(inp, nam) 
269 struct inpcb *inp; 
270 struct mbuf *nam; I 
271 I 
272 struct sockaddr in *sin; 
273 nam->m len = sizeof(*sin); 
274 sin = mtod(nam, struct sockaddr in *); 
275 bzero((caddr t) sin, sizeof(*sin)); 
276 sin->sin family = AF INET; 
277 sin->sin len = sizeof(*sin); 
278 sin->sin port = inp->inp lport; 
279 sin->sin addr = inp->inp laddr; 
280 ) å 
in pcb.c 
U 22-30 in setsockedar 000000000000 
nam mbuf sockaddr_in 
IP 
Internet PCB sin addr[] sin port 
22-31 in setpeeraddr 22-30 PCB 
IP 
in pcb.c 
281 int pe 
282 in_setpeeraddr (inp, nam) 
283 struct inpcb *inp; 
284 struct mbuf “nam; 
285 { 
286 struct sockaddr_in *sin; 
287 nam->m_len = sizeof(*sin); 
288 sin = mtod(nam, struct sockaddr_in *); 
289 bzero((caddr_t) sin, sizeof(*sin)); 
290 sin->sin_family = AF_INET; 
291 sin->sin_len = sizeof (*sin); 
292 sin->sin_port = inp->inp_fport; 
293 sin->sin_addr = inp->inp_faddr; 
294 } š 
in_pcb.c 
0 22-31 in setpeeradr 000000000000 
22.11 in pcbnotify[] in_rtchange[] in_losing[] [| 
ICMP in_pcbnotify 
PCB (TCP[] UDP) IP ICMP 
“ ” TCP 
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TCP/IP 
ICMP TCP PCB 
22-32 ICMP 
H H H H pfctlinput: 00 
0000 O00000000 
quu» 
quu» 
U 22-32 ICMPJ 00000 
ICMP icmp input[] ICMP (U 11-1 
11-2) 
° U 
ICMP ( ) 11 
protosw (7.4 pr ctlinput 
TCP[] UDP tcp_ctlinput[] udp ctlinput 
ICMP[ O | [1 [] IP 
(TCP[] UDP) ICMP D | | U 
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pfctlinput (Internet) 
TCP[] UDP[] Internet 
























































































































































































































































































































































































































































IP 

























































































TES in pcb.c 
307 in pcbnotify(head, dst, fport arg, laddr, lport arg, cmd, notify) 

308 struct inpcb *head; 

309 struct sockaddr *dst; 

310 u int fport arg, lport. arg; 

311 struct in addr laddr; 


312 int cmd; . 
313 void (*notify) (struct inpcb *, int); 

314 ( 

315 extern u, char inetctlerrmap[]; 

316 Struct inpcb *inp, *oinp; 

317 struct in_addr faddr; 

318 u_short fport = fport_arg, lport = lport_arg; 

319 int errno; f 

320 if ((unsigned) cmd > PRC_NCMDS || dst->sa family != AF INET) 
321 return; 

322 faddr = ((struct sockaddr_in +) dst)->sin_addr; 

323 if (faddr.s_addr == INADDR_ANY) 

324 return; 

325 /* 

326 * Redirects go to all references to the destination, 

327 * and use in rtchange to invalidate the route cache. 

328 * Dead host indications: notify all references to the destination. 
329 * Otherwise, if we have knowledge of the local port and address, 
330 * deliver only to that socket. 

331 */ 

332 if (PRC IS REDIRECT(cmd) || cmd == PRC HOSTDEAD) L 

333 fport = 0; 

334 lport - 0; 

335 laddr.s addr = 0; 

336 if (cmd != PRC HOSTDEAD) 

337 notify - in rtchange; 

338 } 

339 errno = inetctlerrmap[cmd]; 

340 for (inp = head->inp_next; inp != head;) { 

341 if (inp->inp_faddr.s_addr != faddr.s_addr || 

342 inp->inp_socket == 0 || 

343 (lport && inp->inp lport != lport) || 

344 (laddr.s addr && inp->inp laddr.s addr != laddr.s addr) || 
345 (fport && inp->inp fport != fport)) ( 

346 inp = inp-»inp next; 

347 continue; /* Skip this PCB */ 

348 ) . j 

349 oinp - inp; 

350 inp = inp->inp next; 

351 if (notify) 

352 (*notify) (oinp, errno); 

353 } 

354 } 


in_peb.c 
U 22-33 in seconotify U D 0 0 0 0000 0 0 0 
































598 TCP/IP 2 Chinapub.tom 
— n MA 

















22-32 TCP 
















































































































































































































































































in_pcbnotify 






































in_rtchange | 






































22-33 in_pcbnotify TCP | tcb 






























































































































































tcp_notify UDP udb 


































































































udp_notify 
1. 
















































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































306-324 cmd | | 0.0.0.0 
2. 
325-338 ( PRC_HOSTDEAD 
IMP — ) 
0 for 
IP PCB IP 
in rtchange([] 22-34) notify 
339 inetctlerrmap (O 11-19 PRC. xxx[] ) 
Unix[] errnol] (U 11-1 ) 
3. PCB 
341-353 PCB PCB — 
if PCB]] (1) 
(2) PCB socket (3) (4) 
(5) 
notify 








































































































































































































22.11.1 in rtchange 





































































































ICMP[] [| | in pcbnotify in rtchange 

























































































| | IP PCB 22-34 





























































































































in_rtchange 





in pcb.c 
391 void + 


392 in_rtchange(inp, errno) 
393 struct inpcb *inp; 


394 int errno; 

395 ( 

396 if (inp->inp route.ro rt) ( 

397 rtfree(inp-»inp route.ro rt); 
398 inp->inp route, ro rt = 0; 

399 za 

400 * A new route can be allocated the next time 
401 * output is attempted. 

402 */ 

403 } 

404 } 


in_pcb.c 
U 22-34 in rtchange 00000000 
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PCB rtfree PCB 
PCB ip output 
pfctlinput 
22.11.2 
PCB 
Ping ping[] IP ICMP 
Ping 
1 402 521 gemini ping 14 025 213 svr4 
gemini gateway netb 22-35 
ping [] [| 
=. 



































D D O 140.252.13 


[] 22-35 ICMP O [] 











gateway 





ICMP 

















































































































gemini $ ping -sv svr4 
PING 140.252.13.34: 56 data bytes 


ICMP Host redirect from gateway 140.252.1.4 


to netb (140.252.1.183) for svr4 (140.252.13.34) 









































































































































































































































































































































































































































































































































































































































64 bytes from svr4 (140.252.13.34): icmp seq-0. time-572. ms 
ICMP Host redirect from gateway 140.252.1.4 
to netb (140.252.1.183) for svr4 (140.252.13.34) 
64 bytes from svr4 (140.252.13.34): icmp seq-1. time-392. ms 
-s ICMP -V ICMP ( 
ICMP ) 
ICMP ping 
PCB IP 
gateway {140.252.1.4} netb{140.252.1.183} 
gemini ICMP 
ping 



















































































































































































gemini $ ping -sv svr4 












































600 TCP/IP 2 China-bubıcom 
NM MEME EE gg 


PING 140.252.13.34: 56 data bytes 
64 bytes from svr4 (140.252.13.34): icmp seq-0,time-388. ms 
































































































































































































































































































































































































































































































































































































































64 bytes from svr4 (140.252.13.34): icmp seq-1. time-363. ms 
IP (U 32[] ) TCP[] UDP 
ICMP pfctlinput([] 22-32) 
IP Ping PCB 
ping 
22.11.3 ICMP UDP 
API UDP ICMP 
connect IP 
































































































































































































































in_pcbnotify 



































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































ICMP UDP ICMP 
in pcbnotifyl] dst IP ICMP IP 
connect PCB[] inp faddr 

inp fport 0 in pcbnotify notify 22-33 
for UDP PCB 

UDP 

( bind) in pcbnotify 
ICMP 
ICMP 
ICMP 
1024[] 5000 
([] 22-23) 
— errno[] — 
UDP sendto 
UDP recvfrom ICMP 
recvfrom (ECONNREFUSED) 
errno ICMP 
API 
UDP ICMP 
ECONNREFUSED 
ICMP UDP 
ICMP 
ICMP UDP 
TCP TIME WAIT 
UDP 
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select 
API D) Unix 
V API(TLI) TLI t rcvuderr 
IP TCP/IP[] SVR4 ICMP 
UDP 
in pcbnotify[] ICMP UDP 
IP 
UDP 
22.11.4 in losing 
PCB 22-36[] in losing TCP 
in pcb.c 
361 int Séi 
362 in_losing(inp) 
363 struct inpcb *inp; 
364 ( 
365 struct rtentry *rt; 
366 struct rt_addrinfo info; 
367 if ((rt = inp->inp_route.ro_rt)) { 
368 inp->inp_route.ro_rt = 0; 
369 bzero((caddr t) & info, sizeof(info)); 
370 info.rti info[RTAX DST] = 
371 (struct sockaddr *) &inp->inp route.ro dst; 
372 info.rti info[RTAX GATEWAY] = rt->rt gateway; 
373 info.rti info[RTAX NETMASK] = rt_mask(rt); 
374 rt_missmsg (RTM_LOSING, &info, rt->rt_flags, 0); 
375 if (rt->rt_flags & RTF_DYNAMIC) 
376 (void) rtrequest (RTM_DELETE, rt_key(rt), 
377 rt->rt gateway, rt_mask(rt), rt->rt flags, 
378 (struct rtentry **) 0); 
379 else 
380 /* 
381 * A new route can be allocated 
382 * the next time output is attempted. 
383 */ 
384 rtfree(rt); 
385 } 
386 } P 
in pcb.c 
U 22-36 in losing [)000000000000 
1. 
361-374 PCB 
rt_addrinfo rt_missmsg RTM_LOSING 
| 






























































































































































602 Term n: China-pubıcom 
— — — EE 




























































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































375-384 (RTF DYNAMIC ) 
RTM DELETE rtrequest 
22.12. I IE 
in_pcblookup PCB 
22.6 bind[] connect 
TCP[] UDP IP in_pcblookup 
TCP[] UDP 
PCB PCB 
in_pcblookup 
[Jain[] Routhier 1986] 














































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































[McKenney[] Dove 1992] 
PCB PCB PCB 
([McKenney[] Dove 1992] Jon Crowcroft|] [Partridge[] Pink 1993] 
Gary Delp) PCB in_pcblookup 
[McKenney[] Dove 1992] Net/l ( ) - 
PCB 
BSD [Hutchinson[] Peterson 1991] 
UDP 
22.13 TIN 
Internet Internet PCB[] TCP[] UDP IP Internet 
IP PCB 
PCB 
1) TCP[] UDP in pcblookup 













































































in pcbbind in pcbconnect 



































































































































































































































2) in pcbbind 
bind TCP connect bind 























































































































































































































U 221 









































603 














































































































































































































































































































UDP O00 sendto[] connect I DO bind 00000000 
3) in pcbconnect[] D D D U 0 U D D D 0 O D D 0 D D D 0 0 D U DE. D 0 D. U U 
U U U U DO D D ODO D DU U D U D 0 U D U D 0 U D U D 0 U D 0 D DU D 0 U 
in_pcbbind 00000000000 
U 22-370 U O0 TCPO UDPI 0000 U U U U PCB) D 0 0 0 0 0 0 0 0 0 D D D D U 
l U U 0000000000 22-370 TCPO UDP 0000000000 
ODO = 
DU 0 D U DU DDD 0 DU D DD U u DDD 0 DU D DD U 
inp_laddr inp_lport inp_faddr inp_fport 

TCP] H O O T in_pcbconnect in_pcbconnect foreignIP fport 
connect(foreignIP,| JD rtalloc[] OM in_pcbbinal] 

Sport) fereignIP] 0000 000000 
O00000000 

TCP 0000 bina localIP Iport foreignIP fport 
(docallP, lport) connect 
(foreignIP fport) 

TGP IM TD H in pcbconnect Iport port fport 
bind(*, lport) connect | JQ rtalloc[] 

(foreignIP. fport) foreign PI H 00 0 
O00000000 

TCPO OOO :bina localIP in_pcbbindl] |] foreignIP port 
(docallP, 0) connect 0000 
(foreignIP, fpori) 

TCPODODODO localIP Iport IP0000 TCPO DO 
bind(locallP, lport) U U DU D DDD 0 
listen()accept() 

tTeOOOOOO»ind| PODODODO | port foreign PO | TCPHUU 
(+, lport) listen()| O O0O000000|000000 
accept() DUU 0.0.0.0 

U DP D D DD in_pcbconnect in_pcbconnect JoreignIP fportQ OO 
sendto(foreignIP fport) | DU rtallocl OO in pcbbindl] 0000800 

foreignP 0 0 D 00 | n nnn nnn n 0000 
D DDD DD DDD D'in senato[ DDD 

D DDD DD DD 0 D 

[] [] [] 0.0.0.0 

U DP T 0 DD in pcbconnect in pcbconnect foreignIP Sport 
connect (foreignIP,| DD rtallocl OM in_pcbbinal] 
fport) write() foreignIPQ D D D D | DO OD nn nn 

D D D D D D DD | 0 writeg 000 
000000 write 
OOOO 


0 22-37 in pcbbind [] in pcbconnect JOO 








604 


U U 


22.1 


22.2 0 


22.3 


224 
22.5 
22.6 
































China-pub.com 




























































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































TCPAPO I] OU 20 
22-230 | | | UI | | | Ú 
[] 22-100 U U U 0 0 D o 0 0 U Telnet] [] 000 U U U 
IP[] DD 000 Ip 0 0 D D D U U Telnet] [] [] 000000 
IP 
0 0 0 O (140.252.1.29, 8888} 0 | 
88880 (DU uuu (140.252.1.29, 8888] 0 
in pcbbind[] D OD | De O | | 
| IP 8888 in pcbbind 
(370 DD U 00000000. 1P000 88880000 U ut 
SO REUSEADDR in pcbbind 00000 
UDPO OO U U 0 0 U 
bind] OU sockaddr in[]J | uut 
O bind O | U 00000 bind] U 
(255.255.255.255) 

























































































ipsu tt 


pes) UD UD D 0 D D D DI 










































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































23.1 ID 
UDP | LH 
0 UDP] IP] O 
Internet SOCK[] DGRAM UDP 
(unconnected) IP 
IP 
22.5 UDP IP 
Lu u IP 
UDP 
232 [] UL Ll 
9[] UDP C 2[] UDP 23-1 
23-2 6 UDP 
6 3 6 
[] [] [] [] 
netinet/udp.h udphar 000 
netinet/udp var.h DO UDPO [J 
netinet/udp usrreq.c UDP] [J 
0231 JIOO00000 
00000 0000000 000000 


E 





ip_output 


0000 
023-2 UDPHOOOOOO0000000 
































606 TCPAPD O 020 China-pubecom 
— sa 





























































































































































































































































































































































































































































































































































23.2.1 DI 
22-3 
[] U U D 0 0 [] U 
udb Struct inpcb UDP PCB TT [] 0 O 
udp_last_inpcb | Struct inpcb * O0O000000000000 0000" 0000 
udpcksum Int O0OOOOO ver D 0 D 0 0 0 
udp in Struct sockaddr_ih 0 000000000 P0O0 
udpstat Struct udpstat UDP] D (0 23-4 
udp_recvspace u_long OOOOOOOOOOOD 41 6000 D 
udp_sendspace u_long 00000000000 921600 
1233 9000000000 
2322 JO 
LU U U U udpstat[] D D. d UDP E D D U 234 OG D D D 0 0 U B. BE. B. D 0 
udpstat[] [] O [] SNMP [1 O 
udps_badlen O0O0000000000000000 ° 
udps_badsum O0O000000000000 ° 
udps_fullsock O0O0000000000000000000 
udps hdrops D D D DDD DDD DDD 0 0 D 
udps ipackets O000000000 S 
udps_noport I0O000000000000000 N 
udps noportbcast O0OO0000000000000000000 ° 
udps_opackets O0O00000000 s 
udps_pcbcachemiss D D D D D peb D D 0 D D 0 0 DD 0 0 
D 23-4 D væstat D DD DDD UDPD D 
0 23-50 0000 netstat -ig IQ 
18,575,142 datagrams received E udps_ipackets 
0 with incomplete header udps_hdrops 
18 with bad data length field udps_badlen 
58 with bad checksum udps_badsum 
84,079 dropped due to no socket udps_noport 
446 broadcast/multicast datagrams dropped due to no socket | udps_noportbcast 
5,356 dropped due to full socket buffers udps_fullsock 
18,485,185 delivered ODO) 
18,676,277 datagrams output udps_opackets 
023-5 UDPI H 
O00 UDPO O Í LU U (ul UO DO U DO U) DO (udps ipackets)[] 
















































































U U 23-50) B U EL U oU U 0 U 

















China bubscom 


23.2.3 SNMP|] [| 



























































0 230 UDPH [| 











































































































607 














































































































O 23-60 7 UDP LU O O [ OU SNMPl] |] [] 0000000000 udpstatl] 
LU LU U LU 
O 23-70 0 0 UDP] ID B. 0 D] 0 0 udptable[]SNMP O 0 UDP PCBO 
O [] udpstat JO] 
SNMP] I udpstat[] [0 O U 
udpInDatagrams udps_ipackets 00000000000000090 
udpInErrors udps_hdrops + D D DD DD DD DDD D D D UDHA 
udps_badsumt OOO00000000000000000000 a 
udps badlen Hp UDP OOOO) 
udpNoPorts udps_noport + O0O00000000000000000 
udps noportbcast 
udpOutDatagrams udps_opackets 0000000090 
U 23-6 udp 0000 SNMP O 











UDP D D 0 0 0 U 


=<udpLocalAddress>.<udpLocalPort> 





udp 





udp 


SNMP] [] 


LocalAddress 
LocalPort 


PCB [| 


inp_laddr 
inp_lport 


U 





U 


00000000 Ip 
20000000000 











23.3 UDP[] prot 


023-7 UDPO 0 DO O udpTable 


osw(] |] 





















































































































































0 23-80 0 0 vPP0 00000 
O O inetsw[l] O [] 

pr type SOCK DGRAM UDP] 00000000 

pr domain &inetdomain UDP Internet] [] 000 

pr protocol IPPROTO_UDP (17) OOO PO 00 ie el U 

pr flags PR ATOMIC|PR ADDR | I0000000000000 

pr input Udp input OPOOOOO 

pr output 0 UDP OOD 

pr_ctlinput udp_ctlinput ICMPJ 00000000 

pr_ctloutput ip_ctloutput 000000000090 

pr usrreq udp usrreg O0000000000 

pr init udp init 000 UDP 

pr_fasttimo 0 UDPTI OOD 

pr_slowtimo 0 UDP OOD 

pr_drain 0 UDPO 0 00 

pr_sysctl udp_sysctl O sysct1 (830 00D 

O 23-8 UDP[] protosw Jj [J 

OO0OOOO0000 vee DO DO 0 D D D D 0 6000 udp_ouvtput]] O 





608 
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TCP/IP 2 
UDP udp usrreq 
23.4 UDPOOOD 
UDP udphdr 23-9[] C 23-10[] UDP 
udp.h 
39 struct udphdr { 
40 u short uh, sport; /* source port */ 
41 u_short uh_dport; /* destination port */ 
42 short uh_ulen; /* udp length */ 
43 u short uh sum; /* udp checksum */ 
44 ); E 
udp.h 
O 23-9 udphdr DI 
0 15 16 : 31 
uh, sport uh, dport ! 
160000 I 16000000 
' 81 
uh, ulen uh sum 
160 UDP [] 160 UDPO 0 D | 
(0000) 
U 23-10 UDPJ D 0 D 0 0 0 
UDP UDP IP 
udp input IP udp_output IP 
IP/UDP udpiphdr 23-11 
- udp var.h 
38 struct udpiphdr { 
39 struct ipovly ui_i; /* overlaid ip structure */ 
40 struct udphdr ui_u; /* udp header */ 
41 T: l 
42 #define ui_next ui_i.ih_next 
43 #define ui_prev ui_i.ih_prev 
44 #define ui $1 ui i.ih xl 
45 #define ui pr ui i.ih pr 
46 #define ui len ui i.ih len 
47 «define ui src ui i.ih src 
48 #define ui dst ui i.ih dst 
49 #define ui sport ui u.uh sport 
50 #define ui dport ui u.uh dport 
51 #define ui ulen ui u.uh ulen 
52 #define ui sum ui u.uh sum 
udp var.h 
D 23-11 udpiphdr TI 0 0 0 Ú) l] IP/UDPO [] 
20 IP ipovly 23-12 
8-8 IP (2000) 






































































































































Chinaspubecom BE 609 



























































































































































































































































23.6 UDP 
38 struct ipovly { N Leier 
39 caddr_t ih_next, ih_prev; /* for protocol sequence q’s */ 
40 u char ih x1; /* (unused) */ 
41 u_char ih pr; /* protocol */ 
42 short ih len; . / protocol length */ 
43 struct in_addr ih_src; /* source internet address */ 
44 struct in_addr ih_dst; /* destination internet address */ 
45 ); 


— OOOO HH var.h 


[] 23-12 ipovly O Ú 


23.5 udp init[] [| 

















































































































































































































































































































































































































































































































































































































































































































































































































domaininit UDP (udp_init 23-13) 
PCB(udb) 
udb PCB 0 PCB 
inp_lport UDP 22.4 
0 1024 

EEE AA E 

50 void udp usrreq.c 
51 udp init() 

52 { 

53 udb.inp_next = udb.inp_prev = &udb; 

54 ) 


Tem. HED usrreq.c 
O 23-13 udp init 00 


23.6 udp output[| |] 













































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































UDP send 
sendto[| sendmsg|| write writev 
sendto|| sendmsg sendto 
sendmsg 23-14 
udp output ip output 
sosend msghdr 
mbu sosend 
mbu PRU SEND 
UDP udp output 23-15 inp 
Internet PCB m mbu addr 
mbuf| Sockaddr in control 
mbu sendmsg 











































































































































































































































































































333-344 m freem UDP 

















610 


TCP/IP 2 
































China-pubecom 




















XXX 




















































































































TCP 



































































































































HO 
























































PRU. SEND | DI 


0000000000 


O 23-14 0 0 0 0 0 0000 0 0 væ output 




































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































2. 
345-359 UDP (addr ) 
in pcbconnect 
EISCONN 
sendto[] [] i | 
splnet IP | 
PCB PCB 
UDP splnet 
IP (U 1-12) 
IP 
[Partridge[] Pink 1993] 
UDP 
PCB[] 0 | laddr 















































































































































































































































Chinaspubecom mee 611 





































































































in pcbconnect in pcbbind 




























































































































































































connect 

































































in pcbconnect 








SIE udp usrreg.c 
334 udp output (inp, m, addr, control) 

335 struct inpcb *inp; 

336 struct mbuf *m; 

337 struct mbuf *addr, *control; 

338 I 

339 struct udpiphdr *ui; š 

340 int len = m->m pkthdr.len; 

341 struct in_addr laddr; 

342 int s, error = 0; 

343 if (control) 

344 m_freem(control); /* XXX */ 

345 if (addr) { 

346 laddr = inp->inp laddr; 

347 if (inp->inp faddr.s addr != INADDR ANY) ( 

348 error = EISCONN; : 

349 goto release; 

350 } 

351 za 

352 * Must block input while temporarily connected. 
353 “7 

354 S = splnet (); 

355 error = in_pcbconnect (inp, addr): 

356 if (error) { 

357 splx(s); 

358 goto release; 

359 ) 

360 } else { 

361 if (inp->inp_faddr.s_addr == INADDR ANY) { 

362 error = ENOTCONN; 

363 goto release; 

364 } 

365 } 

366 /* : 
367 * Calculate data length and get an mbuf for UDP and IP headers. 
368 */ 

369 M_PREPEND (m, sizeof(struct udpiphdr), M_DONTWAIT); 
370 if (m == 0) I 

371 error = ENOBUFS; 

372 goto release; 

373 ) 





409 release: 


410 m freem(m); 
411 return (error); 
412 ) 





udp usrreq.c 


0 23-15 ude output U D 000 DOG 0 0 0 0 D 0 0 0 U 


Chinaspubecom 




















































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































612 TCP/IP 2 
360-364 ENOTCONN 
3. IP/UDP 
366-373 M PREPEND O IPU UDP [] 1-8 | [] 
mbuf| | mbu | 28 23.1] 
M DONTWAIT IP 
M PREPEND 
M WAIT 
23.6.1 IP/UDP mbuf 
M_PREPEND mbuf| sosend 
56 (max_hdr 7-17) IP[] UDP 
M_PREPEND mbuf[| M_PREPEND 
M_LEADINGSPACE mbuf| 
#define M_LEADINGSPACE (m) \ 
((m)->m flags € M EXT ? /* (m)->m_data - (m)-»m ext buf */ 0: N 
(m)->m flags & M PKTHDR ? (m)->m data - (m)->m_pktdat : \ 
(m)->m data - (m)->m dat) 
0 
M PREPEND mbu 
sosend | 
M. LEADINGSPACE[] J] O (2.90 ) 
00000 i 
UDP udp_output TCP 
( ) 
tcp_output M_LEADINGSPACE sosend 
56 tcp_output MGETHDR 
mbu 
23.6.2 UDP[ 
udp output[] [J 0 O UDP IP/UDP 
UDP | IP/UDP | IP 
ipovly 
23-16 udp output m mbu 28 IP/UDP 
udp_output ip_output 
UDP IO U (1) 12 0 [] IP 
(2)8 UDP (3)UDP 23-17 12 
UDP UDP UDP ([] 23-16) 





















































Chi a*pubecom 230 UDP 613 




























































































BD D DD 0 
(TTL) 


0 23-16 IP/UDPO DO UDPIDUDUUDUDU rero DU D 0 0 D D 


0 15 16 
[5 [ee | sm — 


16 
0 23-17 0000000000000 voran 












































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































UDP (1) (O 23-17) 32 bit 
IP ([] 23-16) 32 bit 8 bit 16 bit (2) 32 
bit Internet 16 bit (8.70 ) 
(3) OTT 32 bit 
udp_output udpiphdr (U 23-11) 23-18 
m mbuf] mbu 
20 IP (5 ui_x1[] ui_pr[] ui_len[] ui_src[] ui_dst) 
32 bit IP 32 bit[] (ui_next[] ui_prev) 
0 
23-19 
1) [| 23-19 23-17 






















































































































































































614 os s China*pub.toM 
rn aan re 


0 15 16 31 
ui x1 ui_pr ui_len 
00000 SU D 0 16] 00000 
ui src 


320 D IP[] D 
ui_dst 

320 10P00 f 
ui_sport ui_dport 
160000 i 16000000 
ui ulen ui sum 
16 UDP] [] 160 UDPI OO 

23-18 ude output [J [| [| udpiphdr 


ooo sn UDP 0 | 
IP UDP OO UDP | UDP (000000 
00000 00000 : 00000 
0000 00000 00000 udpiphår 
U U DD DO U U un 000100000 
next prev xl pr len src dst sport dport ulen sum 


' f oy f d dy 


U IP U U IP DD | UDP | UDP 
go Ak mp Pe oojoo joe 20000 


PQ O " . UDP D | 

























p 





| + 











































































































































































































































































































































































































































































































































































































O 23-19 [0 IPUDP[] 000 Vorm D B DH] D D 
2) udpiphdr 23-11 ( 
ui ) udp output[] mbu mbu 
UDP 
3) IP/UDP 23-16 7 
udp_output 3 udp_output 
6 ip_output 
23-20[] udp output 











































































































23-18) PCB 
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374-387 udpiphdr 



























































































































































UDP UDP 

















































































































China=pubecom "- 615 































































































(len 0) UDP (8) UDP UDP 


ui_len|| ui ulen 
































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































udp usrreq.c 
374 /* P- 1 
375 * Fill in mbuf with extended UDP header 
376 * and addresses and length put intó network format. 
377 */ 
378 ui - mtod(m, struct udpiphdr *); 
379 ui->ui next = ui-»ui prev = 0; 
380 ui-»ui x1 = 0; 
381 ui->ui pr = IPPROTO UDP; 
382 ui->ui len = htons((u short) len + sizeof(struct udphdr)); 
383 ui->ui src = inp->inp laddr; 
384 ui->ui_dst = inp->inp faddr; 
385 ui->ui sport = inp->inp lport; 
386 ui->ui dport = inp->inp fport; 
387 ui->ui ulen = ui-»ui len; 
388 qe 
389 * Stuff checksum and output datagram. 
390 */ ° 
391 ui->ui_sum = 0; 
392 if (udpcksum) ( 
393 if ((ui->ui_sum = in_cksum(m, sizeof(struct udpiphdr) + len)) == 0) 
394 ui->ui sum = Oxffff; 5 
395 } 
396 ( (struct ip *) ui)->ip_len = sizeof (struct udpiphdr) + len; 
397 ( (struct ip *) ui)->ip_ttl = inp->inp_ip.ip_ttl; /* XXX */ 
398 ((struct ip *) ui)->ip tos = inp-»inp ip.ip.tos; /* XXX */ 
399 udpstat .udps_opackets++; . 
400 error - ip output(m, inp-»inp options, &inp-»inp route, 
401 š: inp->inp_socket->so_options £ (SO_DONTROUTE | SO_BROADCAST), 
402 inp-»inp moptions); ` 
403 if (addr) ( 
404 in pcbdisconnect (inp); 
405 inp->inp_laddr = laddr; 
406 splx(s); 
407 } 
408 return (error); 
udp_usrreq.c 
U 23-20 ude output 0 0 0 0 D 00 0 0 0 D 0 D 0 0 0 IP 
2. 
388-395 0 in_cksum UDP 
( — 10 11.30) 0 0 
16[] 1 0( 1 0 0) 
UDP ( 0) UDP 0(16 
160 1) 
udpcksum([] 23-3) 1 UDP 
4.2BSD udpcksum 0 
3: UDP TTL] TOS 
396-398 ui IP (ip)L] UDP IP 
IP UDP IP/UDP 28 IP 








































































































































































































616 






































China-pup.com 


























































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































TCP/IP 2 
ip_output 
IP | U TTL[] TOS PCB UDP] [| 
setsockopt — IP TTL[] TOS — 
UDP 
ip output 
4. 
400-402 ip output inp. options setsockopt 
IP IP ip output IP | 
PCB ip output 
SO DONTROUTE( ) |] SO BROADCAST( ) 
2 
403-407 in pcbdisconnect IP 
PCB 
23.7 udp input[|[] 
UDP 23-14 
IP UDP IP 
| | UDP IP ({] 8-15) pr input 
udp input IP udp input 
udp input UDP 
udp input 
1) UDP 
2) UDP PCB 
3) UDP 
Net/3 | 
23.7.1 00 UDP 0 
23-21[] UDP 
55-65 udp input m IP mbuf 
iphlen[] IP ( IP ) 
1. IP 
67-76 IP ip_stripoptions UDP 
IP | IP_RECVOPTS 
| 
77-88 mbuf mbuf 28 (IP UDP ) 
m_pullup mbu 28 mbu 

































































































































































Chinaspubecom "n 617 










































































"ES udp usrreq.c 
56 udp input(m, iphlen) 
57 struct mbuf *m; 
58 int iphlen; 
59 ( 
60 struct ip *ip; 
61 Struct udphdr *uh; 
62 struct inpcb *inp; 
63 Struct mbuf *opts - 0; 
64 int len; 
65 struct ip save ip; 
66 udpstat.udps ipackets++; 
67 /* f 
68 * Strip IP options, if any; should skip this, 
69 * make available to user, and use on returned packets, 
70 * but we don't yet have a way to check the checksum 
71 * with options still present. i 
72 */ 
73 if (iphlen > sizeof(struct ip)) ( 
74 ip stripoptions(m, (struct mbuf *) 0); 
75 iphlen = sizeof(struct ip); 
76 ) 
77 /* 
78 * Get IP and UDP header together in first mbuf. 
79 */ i 
80 ip = mtod(m, struct ip *); 
81 if (m->m len < iphlen + sizeof(struct udphdr)) { 
82 if ((m = m_pullup(m, iphlen + sizeof(struct udphdr))) == 0) 1 
83 udpstat .udps_hdrops++; 
84 return; 
85 } 
86 ip = mtod(m, struct ip *); 
87 } 
88 uh = (struct udphdr *) ((caddr_t) ip + iphlen); 
89 /* f 
90 * Make mbuf data length reflect UDP length. 
91 * If mot enough data to reflect UDP length, drop. 
92 */ i 
93 len = ntohs((u short) uh->uh_ulen); 
94 if (ip->ip_len != len) { 2 
95 if (len > ip->ip_len) { 
96 udpstat .udps_badlen++; 
97 goto bad; 
98 H 
99 m_adj(m, len - ip->ip_len); 
100 /* ip->ip_len = len; */ 
101 } 
102 /* 
103 * Save a copy of the IP header in case we want to restore 
104 * it for sending an ICMP error message in response. 
105 */ : 
106 save_ip = *ip; 
107 /* 
108 * Checksum extended UDP header and data. 
109 */ 
110 if (udpcksum && uh->uh sum) { 


0 23-21 udp input [000000 UDPD D 0 0 0 0 D U 












































618 TCP/IP 2 Chinapub.tom 
— ___ 


























































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































111 ((struct ipovly *) ip)->ih next = 0; 
112 ((struct ipovly *) ip)->ih prev = 0; 
113 ((struct ipovly *) ip)->ih_x1 = 0; 
114 ((struct ipovly *) ip)->ih len = uh-»uh ulen; 
115 if (uh->uh sum = in cksum(m, len + sizeof(struct ip))) í 
116 udpstat.udps badsum++; 
117 m_freem(m); 
118 return; 
119 } 
120 } 
— udp usrreq.c 
U 23-21 (U) 
2. UDP 
333-344 UDP IP (ip len)[] UDP 
(uh ulen) ipintr udp input ip len IP 
(U 10-11) 
1) ip len uh ulen 
2) ip len uh ulen[] IP 23-22 
(UDP JU m. adj m adj 
2-20 mbuf UDP 
UDP 
IP IP 
IP IP 
e— mn — 
IP] O UDP] D UDP D 
| | UDP [] uh_ulen 
IPD O ip ien[] 0 IPD D 0 D 
[] 23-22 UDP OOO 
3) ip_len uh_ulen UDP IP 23-23 
UDP 

































































































































































































































































UDP UDP UDP 


e nn — —& 
E EN 


POO ip ten] D 1.0000 


D 23-23 UDPO OOO 







































































UDP 28 TCP 
— IP IP[] TCP 

















































































































































































































































































































China*pubeeon 619 
















































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































UDP 

UDP 

3. IP UDP 
102-106 udp input IP IP 
110 UDP (udpcksum) UDP ( 

0) 
udpcksum 
UDP 

111-120 IP ipovly ([] 23-18) 

udp_output UDP ( ) 

IP 
23.1.2 
23-24 










































































































































































udp usrreq.c 





206 /* 

207 * Locate pcb for unicast datagram. 

208 c EL 

209 inp - udp last inpcb; 

210 if (inp-»inp lport !- uh-»uh dport || 

211 inp->inp fport !- uh->uh sport || 

212 inp->inp faddr.s addr != ip-»ip src.s addr || 

213 inp->inp laddr.s addr !- ip-»ip dst.s addr) { 

214 inp - in pcblookup(&udb, ip-»ip src, uh-»uh sport, 
215 ip-»ip dst, uh->uh dport, INPLOOKUP WILDCARD) ; 
216 if (inp) 

217 udp last inpcb - inp; 

218 udpstat .udpps_pcbcachemiss++; 

219 } 

220 if (inp == 0) { 

221 udpstat .udps_noport++; 

222 if (m->m flags & (M_BCAST | M_MCAST)) ( 

223 udpstat .udps_noportbcast++; 

224 goto bad; 

225 } 

226 *jp = save_ip; 

227 ip->ip_len += iphlen; 

228 icmp_error (m, ICMP_UNREACH, ICMP_UNREACH_PORT, 0, 0) H 
229 return; 

230 } 





udp_usrreg.c 


O 23-24 udpinput []DO 0 DO D D 0 0 


620 

























































































China-pub.com 



























































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































TCP/IP 2 
1. “ u 
206-209 UDP Internet PCB 
udp last inpcb in_pcblookup UDP PCB 
PCB E 7 
(one-behind cache)[Partridge[] Pink 1993] 
[Mogul 1991] 4.3BSD 
Tahoe 
210-213 PCB PCB 
“ ji [Partridge[] Pink 
1993] UDP 
UDP UDP sendto 
PCB inp laddr[| inp. faddrå] inp_fport 
PCB 
UDP 
bsdi udpps_pcbcachemiss 41 253[] udps_ipackets 
42 485 3% 
netstats udpstat (O 23-5) 
Net/3 udpps_pcbcachemiss 
2. UDP[] PCB 
214-218 | in pcblookup 
INPLOOKUP WILDCARD PCB 
udp last inpcb UDP PCB 
3. ICMP 
220-230 PCB[] UDP ICMP 
mbu m_flags | 
IP ICMP 
ICMP IP (save_ip) 
IP 
icmp_error 
udps_noportbcast 
udps_noport 
iphlen ip_len icmp_error 
ICMP IP IP 20 Traceroute 
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(1 8[] ) ICMP 
23-25 PCB 
ST = udp_usrreq.c 
232 * Construct sockaddr format source address. 
233 * Stuff source address and datagram in user buffer. 
234 */ 
235 udp_in.sin_port = uh->uh sport; 
236 udp_in.sin_addr = ip->ip_src; 
237 if (inp->inp_flags & INP_CONTROLOPTS) { 
238 struct mbuf **mp = £opts; 
239 if (inp->inp_flags & INP_RECVDSTADDR) { 
240 *mp = udp saveopt((caddr t) & ip->ip_dst, 
241 sizeof (struct in addr), IP RECVDSTADDR); 
242 if (*mp) 
243 mp = &(*mp)->m next; 
244 } 
245 #ifdef notyet 
246 /* IP options were tossed above */ 
247 if (inp->inp_flags & INP_RECVOPTS) { 
248 *mp = udp_saveopt ( (caddr_t) opts_deleted_above, 
249 sizeof (struct in addr), IP_RECVOPTS); 
250 if (*mp) 
251 mp = &(*mp)->m next; 
252 } 
253 /* ip sreroute doesn’t do what we want here, need to fix */ 
254 if (inp->inp_flags & INP_RECVRETOPTS) { 
255 *mp = udp_saveopt ((caddr_t) ip srcroute(), 
256 sizeof (struct in_addr), IP RECVRETOPTS); 
257 if (*mp) 
258 mp = &(*mp)->m next; 
259 } 
260 #endif 
261 } 
262 iphlen += sizeof(struct udphdr); 
263 m->m_len -= iphlen; 
264 m->m_pkthdr.len -= iphlen; 
265 m->m_data += iphlen; 
266 if (sbappendaddr (&inp->inp_socket->so_rev, (struct sockaddr *) &udp_in, 
267 m, opts) == 0) { 
268 udpstat .udps_fullsock++; 
269 goto bad; 
270 } 
271 sorwakeup (inp->inp_socket) ; 
272 return; 
273 bad: 
274 m_freem(m); 
275 if (opts) 
276 m freem(opts); 
277 ) 
udp usrreq.c 


0 23-25 ude imw D D 0 0 0.0 0 0 D 00.0 D U 


























































































































231-236 IP IP sockaddr_in 
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TCP/IP 2 
udp_in sbappendaddr 
IP udp_input 
ipintr sbappendaddr 
mbuf 
5. IP_RECVDSTADDR 
337-244 INP_CONTROLOPTS 
recvmsg (O 22-5)[] IP. RECVDSTADDR UDP 
IP udp_saveopt MT_CONTROL 
mbuf 4 IP 23.8 
4.3BSD Reno TFTP 
IP ( 23.6) 
4.4BSD 
23-26 
6. 
245-260 IP_RECVOPTS 
IP IP_RECVRETOPTS 
IP_RECV mp mbuf 
sbappendaddr 23-25 
mbuf[] m next 
7. 
262-272 (m mbuf[] ) IP 
(udp_in) (opts mbu IP ) 
sbappendaddr 
mbu UDP[] IP sorwakeup 
8. 
273-276 UDP udp input bad 
( VT mbu 
23.7.3 | | 
udp input IP 23-26 
121-138 
UDP UDP 
( ICMP ) 22-11 
139-145 IP sockaddr_in udp_in 
sbappendaddr mbu UDP[] IP 
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- - - udp usrreq.c 
121 if (IN MULTICAST(ntohl(ip->ip dst.s addr)) || 
122 in broadcast (ip->ip dst, m->m_pkthdr.rcvif)) ( 
123 Struct socket *last; 
124 /* 
125 * Deliver a multicast or broadcast datagram to *all* sockets 


126 * for which the local and remote addresses and ports match 
127 * those of the incoming datagram. This allows more than 
128 * one process to receive multi/broadcasts on the same port. 
129 * (This really ought to be done for unicast datagrams as 
130 * well, but that would cause problems with existing 

131 * applications that'open both address-specific sockets and 
132 * a wildcard socket listening to the same port -- they would 
133 * end up receiving duplicates of every unicast datagram. 
134 * Those applications open the multiple sockets to overcome an 
135 * inadequacy of the UDP socket interface, but for backwards 
136 * compatibility we avoid the problem here rather than 

137 * fixing the interface. Maybe 4.5BSD will remedy this?) 
138 */ 

139 /* 

140 * Construct sockaddr format source address. 

141 */ 

142 udp in.sin port - uh-»uh, sport; 

143 udp in.sin addr = ip-»ip src; 

144 m->m len -= sizeof(struct udpiphdr); 

145 m-»m data += sizeof(struct udpiphdr); 

146 /* 

147 * Locate pcb(s) for datagram. 

148 * (Algorithm copied from raw intr().) 

149 */ 

150 last - NULL; ` 

151 for (inp = udb.inp_next; inp != &udb; inp = inp->inp_next) { 
152 if (inp->inp_lport != uh->uh_dport) 

153 continue; 

154 if (inp->inp_laddr.s_addr !- INADDR ANY) { 

155 if (inp->inp_laddr.s_addr != 

156 ip->ip_dst.s_addr) 

157 continue; 

158 } 

159 if (inp->inp_faddr.s_addr != INADDR_ANY) { 

160 if (inp->inp_faddr.s_adär != 

161 ip->ip_src.s_addr | | 

162 inp->inp fport != uh->uh sport) 

163 continue; 

164 } 

165 if (last != NULL) { 

166 struct mbuf *n; 

167 if ((n = m_copy (m, 0, M COPYALL)) != NULL) ( 

168 if (sbappendaddr (&last->so_rev, 

169 (struct sockaddr *) &udp_in, 
170 n, (struct mbuf *) 0) == 0) { 
171 m_freem(n); 

172 udpstat .udps_fullsock++; 

173 } else 

174 sorwakeup (last); 

175 } 

176 } 

177 last = inp->inp_socket; 


U 23-26 udp input J)00000000000 
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178 /* 
179 * Don't look for additional matches if this one does 
180 * not have either the SO_REUSEPORT or SO REUSEADDR 
181 * socket options set. This heuristic avoids searching 
182 * through all pcbs in the common case of a non-shared 
183 * port. It assumes that an application will never 
184 * clear these options after setting them. 
185 */ 
186 if ((last->so options € (SO_REUSEPORT | SO_REUSEADDR) == 0)) 
187 break; 
188 } 
189 if (last == NULL) ( 
190 i . 
191 * No matching pcb found; discard datagram. 
192 * (No need to send an ICMP Port Unreachable 
193 * for a broadcast or multicast datgram.) 
194 */ 
195 udpstat .udps_noportbcast++; 
196 goto bad: 
197 } 
198 if (sbappendaddr(&last->so rcv, (struct sockaddr *) &udp in, 
199 m, (struct mbuf *) 0) == 0) 1 
200 udpstat .udps fullsock++; 
201 goto bad; 
202 ) 
203 sorwakeup (last); 
204 return; 
205 } 
udp usrreq.c 
0 23-26 (O) 
146-164 for | UDP PCB PCB 
in pcblookup PCB PCB 
PCB PCB 
IP PCB 
IP 
IP 
in pcblookup 
165-177 (Jast ) 
sbappendaddr mbu m_copy sorwakeup 
last socket 
last m_copy ( mbu ) 
for last 
PCB sbappendaddr[] mbu — 
178-188 SO_REUSEPORT|| SO_REUSEADDR 
sbappendaddr 
189-197 last ICMP 
IP 








23 UDP 
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198-204 ( ) (m) 
sorwakeup udp input 
(U 23-24) 
23.7.4 UDP] Å 
UDP 
IP 
23-27 
PPPO O 
000000 
0000 00000 
UU UDP 
140.252.1.29 .13.35 | O O O 140.252.13 I 
1 I 
red UDP O 0 O O 1P=140.252.1.29 L 
HA e ee eee = | I 
pl I 
Sousa AE mens Y 
I 
t ICMP] OOOO zi 
0 23-27 poda UPP) O0000000000000000 
1) bsdi UDP 140.252.1.29 sun PPP 
Sun IP (sun 
) 
UDP 
2) UDP 
(140.252.13.33) IP IP 
bsdi IP UDP 
3) bsdi ICMP ( bsdi 
) 
IP IP 
—— 23.10 28-16 
TCP IP 
IP IP 
23.8 udp_saveopt[] || 
IP_RECVDSTADDR udp_input udp_saveopt 
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*mp = udp_saveopt ((caddr t) & ip dst, sizeof(struct in_addr), 
IP RECVDSTADDR) ; 
23-28 
udp usrreq.c 
278 /* i 
279 * Create a "control" mbuf containing the specified data 
280 + with the specified type for presentation with a datagram. 
281 */ 
282 struct mbuf + 
283 udp saveopt (p, size, type) 
284 caddr t p; 
285 int size; 
286 int type; 
287 ( 
288 struct cmsghär *cp; 
289 struct mbuf *m; 
290 if ((m = m get (M_DONTWAIT, MT_CONTROL)) == NULL) 
291 return ((struct mbuf *) NULL); 
292 cp = (struct cmsghär *) mtod(m, struct cmsghdr *); 
293 bcopy (p, CMSG_DATA (cp), size); ` 
294 size += sizeof(*cp); 
295 m->m_len = size; 
296 cp->cmsg_len = size; 
297 cp->cmsg_level = IPPROTO_IP; 
298 cp->cmsg_type = type; 
299 return (m); 
300 } 
udp_usrreq.c 
U 23-28 ude saveoet 0000000000 mbuf 
mbuf {} 
NULL 
m_nextpkt NULL 
16 
200 O 
MT_CONTROL 
0 
cmsg_len 16 
cmsg_level IPPROTO_IP 
cmsg type iP rECVbSTADDR (16000000 
0 0 roo 
023-29 OO00000000000000000000 mbut 
276-286 p mbu ( IP ) 
size ( 4[] IP ) type 
(IP_RECVDSTADDR) 
290-299 mbuf M DONTWAIT 
cp mbu cmsghdr (O 16-14) bcopyl] IP 
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IP cmsghdr cmsghdr mbu 
( 16) 23-29[] mbuf| 
cmsg_len | [] emsghdr (12) cmsg data ( 4) 
recvmsg cmsghdr cmsg data 
















































































































































































23.9 udp ctlinput[|[] 

















































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































icmp input ICMP ( 
) pr ctlinput 
if (ctlfunc = inetsw[ ip protox[icp->icmp ip.ip p] ].pr_ctlinput) 
(*ctlfunc) (code, (struct sockaddr *)&icmpsrc, &icp->icmp ip); 
UDP 22-32 udp ctlinput 23-30 
314-322 cmd 11-19 PRC xxx) sa sockaddr in 
ICMP IP ip IP 
ip IP pfctlinput 
(Y 22-321] [| udp ctlinput sa sockaddr in 
ip 22.11 
TCP[] UDP 
IP 
323-325 PRC xxx inetctlerrmap 
ICMP | | ICMP[] [] | 
1) icmp input[] ICMP PRC xxx 
2) [| PRC. xxx 
3) Internet PCB (TCP[] UDP)[] inetctlerrmap[] PRC xxx Unix 
errno 
udp usrreg.c 
314 void m 7 
315 udp_ctlinput (cmd, sa, ip) 
316 int cmd; 
317 struct sockaddr “sa; 
318 struct ip *ip; 
319 1 
320 struct udphdr *uh; 
321 extern struct in_addr zeroin addr; 
322 extern u_char inetctlerrmap[]; 
323 if (!PRC IS REDIRECT(cmd) Ek, 
324 ((unsigned) cmd >= PRC NCMDS || inetctlerrmap[cmd] == 0)) 
325 return; 
326 if (ip) ( 
327 uh = (struct udphdr *) ((caddr t) ip + (ip->ip hl << 2)); 
328 in pcbnotify(&udb, sa, uh-»uh dport, ip-»ip src, uh->uh sport, 
329 cmd, udp notify); 
330 ) else 
331 in pcbnotify(&udb, sa, 0, zeroin addr, 0, cmd, udp notify); 
332 ) 
udp usrreg.c 


0 23-30 udp ctlinput [DD D D D Ú Ú CMPT O 
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11-1 11-2 ICMP 
23-30 UDP ICMP 
icmp_input[] ICMP[] [] | PRC QUENCH udp ctlinput 
11-2 ICMP errno 
326-331 in pcbnotify ICMP PCB udp_ctlinput 
UDP IP in pcbnotify 
udp_notify 
in_pcbnotify in_pcbnotify 
PCB UDP udp_notify 23-31 
301-313 errno so_error 
| select | 
: : udp usrreq.c 
305 static void 
306 udp notify(inp, errno) 
307 struct inpcb *inp; 
308 int errno; 
309 ( 
310 inp->inp socket-»so error = errno; 
311 Ssorwakeup(inp-»inp socket); 
312 sowwakeup (inp->inp. socket); 
313 ) 
udp usrreq.c 
U 23-31 udp notify] 000000000000 
23.10 udp usrreq[]|[] 
| 23-14 UDP 
PRU SEND UDP | 
23-32 udp_usrreq switch 15-17 
udp usrreg.c 
417 int p- q 
418 udp usrreg(so, req, m, addr, control) 
419 struct socket *so; 
420 int reg; 
421 struct mbuf *m, *addr, *control; 
422 1 
423 struct inpcb *inp = sotoinpcb(so); 
424 int error = 0; 
425 int S; i 
426 if (req == PRU CONTROL) 
427 return (in control(so, (int) m, (caddr t) addr, 
428 (struct ifnet +) control)); 
429 if (inp == NULL && reg != PRU_ATTACH) { 
430 error = EINVAL; 
431 goto release; 
432 ] 


DH 23-32 ude usrreq [DD 
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433 LE 

434 * Note: need to block udp input while changing 
435 * the udp pcb queue and/or pcb addresses. 

436 */ 

437 switch (reg) ( 




































































































































































































































































































































































































































































































































































































































































































































































































































































































































































dn 

522 default: 

523 panic("udp usrreq"); 

524 } 

525 release: 

526 if (control) { 

527 printf("udp control data unexpectedly retained\n"); 

528 m_freem(control); 

529 } 

530 if (m) 

531 m_freem (m); 

532 return (error); 

533 } 

udp usrreq.c 
DH 23-32 (0O) 
417-428 PRU_CONTROL ioctl in_control 
429-432 inp PCB PCB 
(PRU_ATTACH) 
433-436 UDP PCB splnet 
udp_usrreg PCB 
UDP ([] IP ) PCB 
UDP in pcblookup UDP 
case 23-33 PRU ATTACH Socket 

438 case PRU, ATTACH: udp usrrege 

439 if (inp !- NULL) ( 

440 error - EINVAL; 

441 break; 

442 ) 

443 S = splnet(); 

444 error = in_pcballoc (so, &udb); 

445 splx(s); 

446 if (error) 

447 break; 

448 error = soreserve(so, udp_sendspace, udp_recvspace); 

449 if (error) 

450 break; 

451 ((struct inpcb +) so->so_pcb)->inp_ip.ip_ttl = ip defttl; 

452 break; 

453 case PRU DETACH: 

454 udp det ach (inp); 

455 break; 

udp usrreq.c 





O 23-33 udp usrreq [] [| [| PRU ATTACH [| PRU DETACH [| [J 
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PRU_ACCEPT 


















































TCP/IP 2 
438-447 PCB EINVAL[] in_pcballoc 
PCB UDP PCB PCB 
448-450 soreserve 16-7 
soreserve | 
9216 (udp. sendspace)[] 41 600 (udp_recvspace) 9200 
(L] NFS 8 KB ) 16 sockaddr_in 
40[] 1024 setsockopt 
451-452 setsockopt PCB IP TTL[] TOS 
TTL 64(ip_deftt1)[] TOS od 0 ) in  pcballoc[] PCB 
453-455 close PRU DETACH 23-34 udp detach 
PRU ABORT 
534 static void udp_usrreq.c 
535 udp_detach (inp) 
536 struct inpcb *inp; 
537 { 
538 int s = splnet(); 
539 if (inp == udp_last_inpcb) 
540 udp last inpcb = &udb; 
541 in_pcbdetach(inp); 
542 splx(s); 
543 ) 
udp_usrreq.c 
0 23-34 ude detach [| [ H 0 0 O 0 UDP PCB 
PCB C 7 ) PCB 
UDP (udb) in pcbdetach[] UDP PCB PCB 
udp_usrreq|| PRU. BIND bind PRU LISTEN 
listen 23-35 
456-460 in pcbbind PRU BIND 
461—463 PRU LISTEN — 
udp usrreq.c 
456 case PRU BIND: 
457 S = splnet(); 
458 error = in pcbbind(inp, addr); 
` 459 splx(s); 
460 break; 
461 case PRU_LISTEN: 
462 error = EOPNOTSUPP; 
463 break; 
udp_usrreq.c 
0 23-35 udp_usrreq [] [| [| PRU BIND [| PRU LISTEN [| [] 
UDP ( JO O connect 
IP 23-6 PRU_CONNECT|| PRU_CONNECT2 
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23 


UDP 






























































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































464-474 EISCONN 
UDP connect PRU_CONNECT 
PRU_DISCONNECT in_pcbconnect 
soisconnected 
475-477 socketpair PRU. CONNECT2 Unix 
478-480 PRU, ACCEPT accept 
udp usrreq.c 
464 case PRU CONNECT: 
465 if (inp->inp faddr.s addr !- INADDR ANY) { 
466 error - EISCONN; 
467 break; 
468 } 
469 s = splnet(); 
470 error = in_pcbconnect (inp, addr); 
471 splx(s); 
472 if (error == 0) 
473 soisconnected (so); 
474 break; 
475 case PRU_CONNECT2: 
476 error = EOPNOTSUPP; 
477 break; 
478 case PRU_ACCEPT: 
479 error = EOPNOTSUPP; 
480 break; 
udp_usrreq.c 
O 23-36 udp_usrreq [J] O [| PRU[] CONNECT [] PRU [] CONNECT2 [] PRU [] ACCEPT [| [] 
UDP PRU_DISCONNECT 
1) UDP PRU_DETACH PRU_DISCONNECT 
2) UDP connect soconnect[] PRU CONNECT 
PRU DISCONNECT 
PRU DISCONNECT 23-37 
udp usrreq.c 
481 case PRU DISCONNECT: 
482 if (inp-»inp faddr.s addr == INADDR ANY) { 
483 error - ENOTCONN; 
484 break; 
485 3 
486 s = splnet(); 
487 in_pcbdisconnect (inp); 
488 inp->inp laddr.s addr = INADDR ANY; 
489 splx(s); 
490 so->so_state &= "Së ISCONNECTED; /* XXX */ 
491 break; 
udp usrreg.c 
U 23-37 udp usrreq [| [| [| PRU_DISCONNECT [0 
ENOTCONN in pcbdisconnect IP 
0.0.0.0 0 0.0.0.0 connect 
PCB 
shutdown PRU. SHUTDOWN UDP 

































































































































































632 

































































































































































China-bubcom 







































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































TCP/IP 2 
23-38 PRU_SHUTDOWN|| PRU SEND 
PRU ABORT 
492-494 socantsendmore 
495-496 23-14 | udp surreq PRU SEND | udp 
output udp usrreq release ([] 23-32) 
mbuf[] (m)[] IP mbu 
mbu 
————— ——AOI —— HIH usrreq.c 
492 case PRU_SHUTDOWN: 
493 socantsendmore (so); 
494 break; 
495 case PRU_SEND: : 
496 return (udp output (inp, m, addr, control)); 
497 case PRU_ABORT: f 
498 soisdisconnected(so); 
499 udp_detach (inp); 
500 break; 
—  " —. HHH HSG C 
O 23-38 ude usrreg [|] [| [| [| PRU [] SHUTDOWN [| PRU [] SEND [] PRU [] ABORT [] [| 
UDP 
sosend udp usrreg udp output 23-20 
udp output ip outputl| ip output ether output 
( JOD sendto 
ether output ENOBUFS 
497-500 UDP PRU_ABORT PCB 
PRU_SOCKADDR|| PRU PEERADDR getsockname 
getpeername PRU SENSE 23-39 
udp usrreg.c 
501 Case PRU, SOCKADDR: 
502 in_setsockaddr(inp, addr); 
503 break; 
504 case PRU_PEERADDR: 
505 in_setpeeraddr (inp, addr); 
506 break; : 
507 case PRU_SENSE: 
508 JE 
509 * fstat: don't bother with a blocksize. 
510 */ 
511 return (0); 
udp usrreq.c 
U 23-39 ude usrreq [ O O O PRU [] SOCKADDR [] PRU[] PEERADDR [| PRU[] SENSE [] [] 
501-506 in setsockaddr[] in setpeeraddr[] PCB 
addr 
507-511 fstat PRU SENSE OK 
TCP stat st blksize 
23-40 7|] PRU. xxx | UDP 
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PRU RCVD mbu (m 
) PRU_RCVOOB mbu 
switch mbuf| PRU RCVOOB mbu 
udp usrreq.c 
512 case PRU SENDOOB: 
513 case PRU FASTTIMO: 
514 case PRU SLOWTIMO: 
515 Case PRU, PROTORCV: 
516 Case PRU PROTOSEND: 
517 error - EOPNOTSUPP; 
518 . break; 
519 case PRU, RCVD: 
520 Case PRU RCVOOB: 
521 return (EOPNOTSUPP); /* do not free mbuf's */ 
udp usrreq.c 





O 23-40 udp usrreg 000000007000 


23.11 udp. sysct1[|[] 
































































































































































































































































































































































































































UDP[| sysctl UDP | 
sysct1(8) UDP 23-41 udp_sysctl 
sysctl_int udpcksum 

I - udp usrreq.c 
547 udp.sysctl(name, namelen, oldp, oldlenp, newp, newlen) 
548 int *name; 
549 u int namelen; 
550 void *oldp; 
551 size t *oldlenp; 
552 void *newp; 
553 size t newlen; 
554 I i 
555 /* All sysctl names at this level are terminal. */ 
556 if (namelen != 1) 
557 return (ENOTDIR); 
558 switch (name[0]) { 
559 case UDPCTL_CHECKSUM: . i 
560 return (sysctl_int (oldp, oldlenp, newp, newlen, &udpcksum)); 
561 default: 
562 return (ENOPROTOOPT); 
563 } 
564 /* NOTREACHED */ 
565 } 
udp_usrreq.c 
0 23-41 udp sysctl [| J 
23.12 OAD 
23.12.1 UDP PCB 0 
22.12 PCB PCB 















































































































































23-24[] UDP = í 
“ ” PCB ( 
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TCP/IP 2 
) [Partridge[] Pink 1993] 
PCB 
PCB 
[Partridge[] Pink 1993] 555 
128.1.2.3 1600 
PCB 128.1.2.3 1600 
(cache hiding) 
PCB PCB 
PCB[] PCB 
555 ( 
) 
[Partridge[] Pink 1993] PCB 
[Mogul 1991] 
PCB[] PCB 
[Partridge[] Pink 1993] 100 000 
UDP 57% PCB 30% PCB 
udp_input CPU 
UDP 
UDP — 
[McKenney[] Dove 1992] (OLTP) 
[Partridge[] Pink 1993] 22.12 
OLTP PCB 
23.122 UDP 
[Net/3 
mbuf[] (uiomove sosend 
) UDP ( in cksum[] udp output ) 
[Partridge[] Pink 1993] 23-14[] UDP UDP 
udp sosend sosend UDP ( 
in cksum ) in uiomove mbuf| 
( uiomove) 
40%[] 45% 
UDP UDP UDP 
soreceive 
(udp soreceive) 
udp soreceive 
EWOU BLOCK UDP 
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1) select UDP 
EWOULDBLOCK 
2) 
100 
40 recvfrom 40 60 
[Partridge[] Pink1993] 
CPU RISC 
23.13 En 
UDP TCP UDP 
IP[] UDP ip_output 
UDP UDP 26 
TCP 
udp_input ( ) 
IP 
Internet PCB UDP 
udp_ctlinput ICMP udp usrreq 
PRU xxx| 
U U 
23.1 udp output ip output[] mbuf| ( sosend) 
23.2 IP! 
23.3 UDP bind 
23.4 23-15 M_PREPEND udp_output 
23.5 udp_output 0 OL] UDP 
23.6 IP_RECVDSTADDR 
23.7 udp saveopt([] 23-38) mbu 
23.8 UDP connect 
sendto 
23.9 22-25 | IP 255.255.255.255 connect[| UDP 
IP UDP 
255.255.255.255 sendto 










































































































































































China-pubs 
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TOPO D UL EL EL E] U 






















































































































































































































































































































































































































































































































































































































































































































































































































































































































































































24.1 DU 
R 0 00 Teen D Ú 000000 U 
u | | | 000000 ul | U 0 UDP 
23 UDP{[] 9 800[] C 
TCP 28 4500[] C 0 TCP 7 l L LU 
O | O TCP 0000 | OO 100 170 -D 240000 TCP 
LU U U 
24.2 9000 
TCP 7 TCP 6] C O O TCP 
lT] | 24-1 
U [] Ë Ë 
netinet/tcp.h tcphdr[] 000 
netinet/tcp debug.h tcp. debug 000 
netinet/tcp fsm.h TCP Hl d d B D DÚ 
netinet/tcp seg.h H H TCP H H H H H H 
netinet/tcp timer.h TCP) 00090 
netinet/tcp var.h tcpcb (000 ) 0 tepstat (000000 
netinet/tcpip.h TCP-IP O00 
netinet/tcp debug.c OO so_pvEsucl JUD DDD (27.100) 
netinet/tcp input.c tcp input] 00000 G 280 O 290) 
netinet/tcp output.c tcp output 0000040260) 
netinet/tcp_subr.c DO TCP HB (0270) 
netinet/tcp_timer.c TCP 0000 (0250 ) 
netinet/tcp usrreq.c PRU. xxx[] 00 0 300 ) 
U 24-1 TCO 0000090090 
02420 000 TCPE ODO ul U U D U U U U 00060! 
LU U SU 000 TcPD 000080000 protoswl UU GO 24-80 0 9 tcp output [] 


24.2.1 








































































































24-3 





TCP 
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0000000 000000 getsockopt 


setsockopt 


domaininit 






































































































































0 242 TCPO 000000000000 
0 U u au Ë [] 
tcb struct inpcb TCP Internet PUT J 
tcp. last inpcb struct inpcb *| JIOO0000000POGBG000 0000" 0000 
tcpstat struct tcpstat TCP) 0 [] O (0 24-4) 
tcp_outflags u_char O0O00000000000 C 24-16) 
tcp_recvspace u_long OO000000000 819200) 
tcp sendspace u long U U U 0 UU UU UU U (819200) 
tcp iss tcp. seq TCP] 0 D D H] dss) 
tcprexmtthresh int AC I0O00000GO0000000 
tcp mssdflt int O O MSSQ (5120 [] ) 
tcp rttdflt int 00000 RTTD D 0 D GO) 
tcp. do rfrc1323 int O0O00G00)0000000000000 
tcp now u long 0 O RFC 13230 0 0000 500 ms] O O 
tcp_keepidle int pago 00000000 200) 
tcp_keepintvl int O0O000000000000060) 
tcp maxidle int D D DDD DDD D DDD DDD (1000) 
0243 11 D.D D.D UD 00 00N 
24.2.2 



































tcpstat TCP | 24-4 









































































































































































































































































































































tcpstat[] [] O O SNMP[] [] 








tcps_accepts 


HO 
HO 


000000) 


(0 O connect) . 


0000 (SYND uto» . 
(OO connect] JJ ) 


tcps_closed 
tcps_connattempt 
tcps_conndrops 


L3 r3 0 
= 


tcps_connects 


D 
e 


tcps delack 


a 
FG 


D SYNDOD) š 
0 (0000000 SYN 


tcps_drops 
tcps_keepdrops 
tcps_keepprobe 


vu 

š 

n 
Onooo 
r3 





2o 
Og C C0 C G C o 


D DDD DD D 


tcps keeptimeo 


tcps_pawsdrop 


"d 
O 
= 


tcps_pcbcachemiss 


tcps_persisttimeo 





Q ol 
oy =! 
Oo 


tcps_predack 


tcps_preddat 


> Og O 0 

ra EH 4 0 G A G G G 
c3 H rm 

o o 

oOo 


Qn 
A 


tcps_rcvackbyte 











A^ 
CH 
oo! 
L3 L3 L3 D D L3 C3 C3 C3 B3 C D C D C C3 oo Do Do EH 


tcps rcvackpack 
tcps rcvacktoomuch OOO ACKT ODO 
tcps rcvafterclose 


tcps rcvbadoff 


tcps rcvbadsum 
tcps rcvbyte 


tcps rcvbyteafterwin 








D 
e 
A 


tcps rcvdupack 


























tcps rcvdupbyte 

















tcps rcvduppack 





tcps rcvoobyte 

tcps rcvoopack 

tcps rcvpack 

tcps rcvpackafterwin 
tcps rcvpartdupbyte 


tcps rcvpartduppack 
tcps rcvshort 
tcps rcvtotal 


tcps rcvwinprobe 


tcps rcvwinupd 


5014010 G G AOLO GOG GA E E: EES EEN E EIER > E 


tcps rexmttimeo 


L3 F3 E3 E3 E3 ESP E E3 E3 E3 E3 E3 nganangana Est 3 =i: N 


Si EN EE EN GERE EEN 1 Ed EY E ECH EY E13 L1 0141 E 


a 
4 


tcps_rttupdated 


4 
4 























OOO 
D aqu =0) 


tcps segstimed 
tcps sndacks 
tcps sndbyte 


æ EI Or 
A^ 
E 
El 


SYND FINO RSDD D 0 (0000 =0) 
OO Gogg >9) 
000400000000 10000) 


tcps_sndctrl 
tcps_sndpack 








tcps_sndprobe 
tcps_sndrexmitbyte 
tcps_sndrexmitpack 


tcps_sndtotal 


S G G O G p 


Do@ßooooo 
L3 OD gg y 


(0000 =0) 
(10.000 =0) 


tcps_sndurg 
tcps_sndwinup 


















































OO 00000000 RADO DI DD DD DEE > DC dÉ CC 














tcps timeoutdrop 





D 24-4 tcpstat D 0 TCPO 0 D 
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netstat-s TCP 24-5 
30 E 
— tcps_snd(pack, byte) 
tcps sndpack|| tcps sndbyte 
tcps sndbyte 3 722 884 824 - 22 194 928 
450 tcps rcvackbyte 3 738 811 552 
- 21 264 360 ( 565 ) 
netstat printf %d( ) %lu( 
) 32 
(2?- 124 294 967 295) 





















































tepstat [] [| 


tcps sndtotal 

tops snd (pack, byte} 

tcps, sndrexmit (pack, byte) 
tcps, sndacks,tcps delack 
tcps sndurg 

tcps sndprobe 

tcps, sndwinup 
tcps_sndctrl 


netstat -s 00 


10,655,999 packets sent 
9,177,823 data packets (-22,194,928 bytes) 
257,295 data packets (81,075,086 bytes) retransmitted 
862,900 ack-only packets (531,285 delayed) 
229 URG-only packets 
3,453 window probe packets 
74,925 window update packets 

279,387 control packets 


8,801,953 packets received 
6,617,079 acks (for -21,264,360 bytes} 

235,311 duplicate acks 

0 acks for unsent data 

4,670,615 packets (324,965,351 bytes) rcvd in-sequence 
46,953 completely duplicate packets (1,549,785 bytes) 
22 old duplicate packets 

3,442 packets with some dup. data (54,483 bytes duped) 
77,114 out-of-order packets (13,938,456 bytes) 

1,892 packets (1,755 bytes) of data after window 

1,755 window probes 

175,476 window update packets 

1,017 packets received after close 

60,370 discarded for bad checksums 

279 discarded for bad header offset fields 

0 discarded because packet too short 


















































tcps rcvtotal 
tcps_rcvack(pack, byte) 
tcps, rcvdupack 

tcps rcvacktoomuch 

tcps, rcvípack, byte] 
tcps_rcvdup (pack, byte} 

tops pawsdrop 
tcps_rcvpartdupípack, byte} 
tcps, rcvooípack, byte} 

tcps rcv(pack,bytejafterwin 
tcps rcvwinprobe 

tcps rcvwindup 

tcps, rcvafterclose 
tcps_rcvbadsum 

tcps rcvbadoff 

tcps, rcvshort 
























144,020 connection requests 
92,595 connection accepts 
126,820 connections established (including accepts) 
237,743 connections closed (including 1,061 drops) 
110,016 embryonic connections dropped 
6,363,546 segments updated rtt (of 6,444,667 attempts) 
114,797 retransmit timeouts 

86 connection dropped by rexmit timeout 
1,173 persist timeouts 
16,419 keepalive timeouts 

6,899 keepalive probes sent 

3,219 connections dropped by keepalive 


tcps connattempt 

tcps accepts 

tcps connects 

tcps, closed,tcps drops 
tcps, conndrops 

Sr ENN 
tcps rexmttimeo 
tcps timeoutdrop 
tcps persisttimeo 
tcps_keeptimeo 
tcps_keepprobe 
tcps_keepdrops 




















733,130 correct ACK header predictions 
1,266,889 correct data packet header predictions 
1,851,557 cache misses 


tcps_predack 
tcps_preddat 
tcps pcbcachemiss 








U 24-5 TCP] 9000 





640 


















































Ch 























ina*bub.tom 



















































































































































































































































































































































































TCP/IP[] | Uu 20 
24.2.3 SNMP[] 

[] 24-6[] SNMP TCP 14[] SNMP U lT U T U) 
tepstat 000000000 OOO Ne/30 0000! tepCurrEstab] J [0 
O TCP PCB[] [] Internet PCBO O UL 

O 24-70 0 O tepTable[] O TCP] [| [| (listener table )[] 

SNMP) [] tcpstat[] 0000 H" O 

tcpRtoAlgorithm 4 O0000000000000 

1000 

2=RTOI D D D D 

3=MIL- STD- 17780 0 BO 
4=Van Jacobson] UU Å 

tcpRtoMin 1000 I00000000000000 

tcpRtoMax 64000 I00000000000000 

tcpMaxConn =1 U U 0 0 D U repr D c 10 D D ü np» 

tcpActiveOpens tcps_connattempt N CLOSED] [] O SYN SENT D Ü 

tcpPassiveOpens tcps accepts N LISTEN] [] 0 SYN RCVD[ DD 

tcpAttemptFails tcps_conndrops 0 SYN_SENT[] SYN RCVD[ 0 [| CLOSED] 

O O +0 SYN RCVDO DD LISTEN] OO 
tcpEstabResets tcps_drops [] ESTABLISHED[] CLOSE WAIT] [| 5 
CLOSED] O O 
tcpCurrEstab (000) 0 000 ESTABLISHED[] CLOSE WATT [] 
0000 

tcpInSegs tcps_rcvtotal 000000 

tcpOutSegs tcps sndtotal - 0000000000000 

tcps_sndrexmitpack 

tcpRetransSegs tcps_sndrexmitpack 00000 

tcpInErrs tcps_rcvbadsum + 00000000 

tcps_rcvbadoff + 
tcps_rcvshort 
tcpOutRsts ( Uu» RST[] D D D D D O UU 0 
0246 te] 0000 SNMPQ [] 
index = <tcpConnLocalAddress>.<tcpConnLocalPort>.<tcpConnRemAddress>.<tcpConnRemPort> 
SNMP] [] PCBO O Oo U 
tcpConnState t state 00000 1= CLOSED, 2=LISTEN, 3 = SYN SENT, 
4 = SYN RCVD, 5 = ESTABLISHED,6 = FIN WAIT, 
7 = FIN WAIT 2, 8 = CLOSE WAIT, 9 = LAST ACK, 
10 = CLOSING, 11 = TIME WAIT,12 = [] 0 TCPO OO 
tcpConnLocalAddress inp. laddr O dr O 
tcpConnLocalPort inp lport 00000 
tcpConnRemAddress inp_faddr O O 1P0 0 
tcpConnRemPort inp_fport 000090 
0 24-7 TCPO [| O O tepTable 0000 





Chi à*buf to 





24] TCP 64 I 









































































































































































































































































































































































































































































































































































































































PCB (t. state)[] [| TCP ([] 24-13) Internet PCB 
([] 22-4) 
24.3 TCP [] protoswl] |] 
24-8 TCP protosw| TCP 
0000 inetsw[2] LH O 
pr_type SOCK_STREAM TCP 00000000 
pr_domain &inetdomain TCP[] [] Internet] [] O 
pr_ptotocol IPPROTO_TCP (6) OO POOOip el 
pr_flags PR_CONNREQUIRED|PR_WANTRCVD 000000000000 
pr input tcp input U IP D D 0 
Pr output 0 TcP [1 D B 0 U 0 UO DH 
pr ctlinput tcp ctlinput OOICMPINOOOOOOD 
pr ctloutput tcp ctloutput 0000000000 
pr_usrreg tcp usrreg O0OO0000000 
pr init tcp init TCPO OO 
pr_fasttimo tcp fasttimo U D D D D D D 200 ms 000 
pr_slowtimo tcp_slowtimo 0000000 soom 000 
pr_drain tcp_drain NO mbuff] OO00 
pr sysctl 0 TCP[] B. D D 0 0 UD. U 
[] 24-8 TCP protosw [] [| 
24.4 TCP|[] ND 
tcphdr TCP 24-9 tcphdrl] [| | 24-10[] TCP 
tcp.h 
40 struct tcphdr { 
41 u_short th_sport; /* source port */ 
42 u_short th_dport; /* destination port */ 
43 tcp_seg th_seg; /* sequence number */ 
44 tcp seg th ack; /* acknowledgement number */ 
45 #if BYTE ORDER == LITTLE ENDIAN : 
46 u char th x2:4, /* (unused) */ 
47 th off:4; /* data offset */ 
48 #endif 
49 #if BYTE_ORDER == BIG_ENDIAN ; 
50 uchar th_off:4, /* data offset */ 
51 th x2:4; /* (unused) */ 
52 #endif 
53 u char th flags; /* ACK, FIN, PUSH, RST, SYN, URG */ 
54 u short th win; /* advertised window */ 
55 u_short th sum; /* checksum */ 
56 u short th_urp; /* urgent offset */ 
57 ): 
tcp.h 


0 24-9 tcphar D D 


642 


TCP/IP 2 












































15 16 


th sport 
1600000 
th seq 
320 D 0 


th_ack 


3200000 


th_off 


4 
0000 


China-pub.com 


th_dport : 


16100000 


31 


th x2 uJAIPIRISIF "mm 
oo R|C|S|S|Y|I = 
(60 ) G|K|H| TININ 160000 


th sum th urp 
160 TCPO OO 10 D D D 0 00 D 
«aun 











































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































[] 24-10 TCP[] [] L1 L1 B LI D 
RFC ( 1) TCP 
th urp í (urgent pointer)” í 
(urgent offset)” 16 bit th_seg 
32 bit ( 
) 24-13 TCP 
32 bit snd_up “ " 
TCP 16 bit " pi 26.6 
TCP 4 bit 6 bit 6 bit C 
4 bit 8 bit 8 bit 
C fifdef 
TCP 4 bit th o££[] “ " C " Ñ 
TCP 32 bit 
th flags 6 24-11 
Net/3 TCP “ IP + TCP "[] tep input IP 
tcp output IP 24-12 tcpiphdr 
IP/TCP 
38-58 23-19 ipovly 20 IP 
(20 ) IP 




































































































































































China-pubeeom "n" 643 






























































th flags O O 





TH_ACK 0000 (th_acxodO n 

TH_FIN 00000000 

TH PUSH | D0O000000000000000 
TH_RST 0000 

TH_SYN 0000 0000) 

TH_URG 0000000 (th—urp)l O 














0 24-11 th flags |] 


















































































































































































































































































































































































































































































































































- tcpip.h 
38 struct tcpiphdr ( 
39 struct ipovly ti i; /* overlaid ip structure */ 
40 struct tcphdr ti t; /* tcp header */ 
41 }; 
42 #define ti next ti_i.ih_next 
43 #define ti_prev ti_i.ih_prev 
44 #define ti x1 ti i.ih x1 
45 #define ti pr ti i.ih pr 
46 #define ti len ti i.ih len 
47 #define ti src ti i.ih src 
48 #define ti, dst ti i.ih dst 
49 #define ti sport ti t.th sport 
50 #define ti dport ti t.th dport 
51 #define ti seq ti t.th seq 
52 #define ti ack ti t.th ack 
53 #define ti x2 ti t.th x2 
54 #define ti, off ti t.th off 
55 #define ti flags ti t.th flags 
56 #define ti win ti t.th win 
57 #define ti sum ti t.th sum 
58 #define ti urp ti t.th urp I 
tcpip.h 
[ 24-12 tcpiphdr 00000000 PTEN U 
24.5 TCPO OD D DÚ 
22-1 Internet PCB TCP tcpcb 
UDP Internet PCB 
TCP| 140 22-1 Internet PCB[] TCP 
24-13 TCP| 
tcp var.h 
41 struct tcpcb ( 
42 struct tcpiphdr *seg next; /* reassembly queue of received segments */ 
43 struct tcpiphdr *seg prev; /* reassembly queue of received segments */ 
44 short t state; /* connection state (Figure 24.16) */ 
45 short t timer[TCPT NTIMERS]; /* tcp timers (Chapter 25) */ 
46 short t rxtshift; /* log(2) of rexmt exp. backoff */ 
47 short t rxtcur; . /* current retransmission timeout (#ticks) */ 
48 Short t dupacks; /* #consecutive duplicate ACKs received */ 
49 u short t maxseg; /* maximum segment size to send */ 
50 char t force; /* 1 if forcing out a byte (persist/OOB) */ 
51 u short t, flags; /* (Figure 24.14) */ 


O 24-13 tee I O O TCO O O 


52 
53 
54 
55 
56 
57 
58 
59 
60 
61 
62 
63 
64 
65 
66 
67 
68 
69 
70 
71 
72 
73 
74 
75 
76 
77 
78 
79 
80 
81 
82 
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100 
101 
102 


103 
104 
105 
106 


107 
108 












































644 ms s China"pub.tom 
ee reven de — — as 


struct tcpiphdr ft template; /* skeletal packet for transmit */ 
struct inpcb *t inpcb; /* back pointer to internet PCB */ 
/ * < 
* The following fields are used as in the protocol specification. 
* See RFC783, Dec. 1981, page 21. 


* 

/* send sequence variables */ 
tcp_seq snd_una; /* send unacknowledged */ 
tcp_seq snd nxt; /* send next */ 
top Sed snd up; /* send urgent pointer */ 
tcp.seq snd wll: /* window update seg seq number */ 
tcp seq snd_wl2; /* window update seg ack number */ 
tcp seq iss; /* initial send sequence number */ 
u long snd_wnd; /* send window */ 

/* receive sequence variables */ j 
u_long rcv_wnd; /* receive window */ 
tcp seq rcv nxt; /* receive next */ 
tcp.seqd rcv up; /* receive urgent pointer */ 
top. seg irs; /* initial receive sequence number */ 

/* i 

* Additional variables for this implementation. 

*/ 

/* receive variables */ 
tcp.seq rcv. adv; /* advertised window by other end */ 

/* retransmit variables */ 
tcp seq snd max; /* highest sequence number sent; 


*.used to recognize retransmits */ 
/* congestion control (slow start, source quench, retransmit after loss) */ 
u long snd_cwnd; /* congestion-controlled window */ 
u long snd ssthresh; /* snd cwnd size threshhold for slow start 
* exponential to linear switch */ 
/* oh a8 
* transmit timing stuff. See below for scale of srtt and rttvar. 
* "Variance" is actually smoothed difference. 


*/ 
short t_idle; /* inactivity time */ 
short t_rtt; /* round-trip time */ 
tcp seq t rtseq; /* sequence number being timed */ 
short t srtt; /* smoothed round-trip time */ 
short t rttvar; /* variance in round-trip time */ 
u.short t rttmin; /* minimum rtt allowed */ 
u long max sndwnd; /* largest window peer has offered */ 
/* out-of-band data */ 
char t oobflags; /* TCPOOB HAVEDATA, TCPOOB HADDATA */ 
char t iobc; /* input character, if not SO OOBINLINE */ 
short t_softerror; /* possible error not yet reported */ 
/* RFC 1323 variables */ 
u_char snd_scale; /* scaling for send window (0-14) */ 
u_char rcv_scale; /* scaling for receive window (0-14) */ 
u_char request r scale; /* our pending window scale */ 
u char requested s scale; /* peer's pending window scale */ 
u long ts recent; /* timestamp echo data */ 
u long ts recent age; . /* when last updated */ 
tcp seq last ack sent; /* sequence number of last ack field */ 
T: 
#define intotcpcb (ip) ((struct tcpcb *) (ip) ->inp_ppcb) 
#define sototcpcb (so) (intotcpcb(sotoinpcb(so))) 
tcp. var.h 


U 24-13 (0) 











TCP| 
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l U utut lu LU LI | U 
24-14] U U t flags 
t_flags [] [] 

TF ACKNOW OO00 Ack 

TF_DELACK 0000 ACK 

TF_NODELAY pp4adg pd 0 00000 00000000 OO Nagle 0 > 

TF_NOOPT HUU Ter] D (0 D 0 D TCPD mun» 

TF_SENTFIN FIND O O 

TF RCVD SCALE | 0 0 0 SYND D D DD D DDD DDD 0 D 

TF RCVD TSTMP | 000 SYND DD 0 B B d ü d Dn 

TF REQ SCALE | DD UDO Svwü 0000000000 

TF REQ TSTMP | 0 D DDD SYND D DD DD 0 0 










































































24.6 TCP[] 00000 











[] 24-14 € flags 90 



























































































































































































































































































































































































































































































































































































































































































































































































































































TCP[] 00000000000 LU U U U U U U) 24-150 l) 
TCP 
LU L) U U U U | TCPO OO00000 TCP 0 | LISTEN] [1 Ú 0 
[] SYN SENT SOCKET API [] Ü | (0 O listen] O 
[| connect) 
TCP 00000 t statel [| OO 24-16] 
|0 0 tcp_outflagsH Hd D D EL CL UI l U U UU Cep output] | 
24-16| L U U l U U U l U U U 
LU LU U (U U | 
#define TCPS HAVERCVDSYN(s) ((s)>=TCPS SYN RECEIVED) 



























































































































































































































































































































































































































































































































































#define TCPS HAVERCVDFIN(s) ((s)>=TCPS TIME WAIT) 
uuu OOOO t_statell [| TCPS ESTABLISHED[|[] tcp. notify[J O 
ICMP 
TCPS, HAVERCVDSYNJ [] L| LE [I LU] IJ UU TCPS_HAVERCVDFIN 0 
| O Y CLOSE WAIT[] CLOSING[] LAST ACK| OOO FIN OM 
29 U uu 
[] shutdown [] 1 = 1] "[] TCP[] [] FIN 
| (0 10 18.5 TCP og 
0 24-150 0 0 ESTABLISHED| IO" | "10000 UU 
iE "[] FIN. WAIT 1 OOOO FIN WAIT 2 DO OO DD 















































































































































646 


send: |RST 






TCP/IP 












































app 0 00 


send: <[] > 


TIME_WAIT 


24.7 TCPODO 


TCP 


TCP 


China-pubecom 


















































SYN 











FIN 
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24-10) 


32 bit 




























































































32 bit 































































































Chinaspubecom o 


rer 647 

























































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































UU u LU U L l U U UD U 00 U U UD 10 U 0 0 0 
LU U 0 ACK LU U 0 0 D D D D D D 0 U | DO ACKT Ú u 
OM 0 uuu SYNU (SYN. SENTI] 24- 
16 tcp outflags[2]) RST ACK 
t_state O 0 O tcp outflags[] 
TCPS CLOSED 0 OO TH RST| TH ACK 
TCPS LISTEN 1 200000400090) 0 
TCPS SYN SENT 2 OHOOSYNG OOO ) TH_SYN 
TCPS_SYN_RECEIVED 3 000000 SYNO DD ACK TH_SYN| TH_ACK 
TCPS_ESTABLISHED 4 0000000) TH_ACK 
TCPS_CLOSE_WAIT 3 I U U FINE BL EL H BH B] UL E] H TH ACK 
TCPS FIN WAIT 1 6 000000 FIND DD ACKO FIN TH FIN|TH ACK 
TCPS CLOSING 7 0000000 ACK TH FIN|TH ACK 
TCPS LAST ACK 8 DOOFNIOOODODO ACK TH_FIN| TH_ACK 
TCPS_FIN_WAIT_2 9 000000 FIN TH_ACK 
TCPS_TIME_WAIT 10 00000 22MSL[ DU og TH ACK 
H 24-16 t state [] D 
TCPÍ 0 LU U U U TCP | 
(U 24-13)[] 130 | 8 ( JO SI IH Bg OOOO) 
24-17[] DOU 4[] snd wnd[] snd_una[] snd_nxt 
snd mazi | | OOOOO 1-0 nd 
snd wnd=6: 00000 
(U DD DDD) 
ET pg 
U D 0 U i 
== 
1 2 3 4 5 6 | 7 8 9 10 11 
00000 
— — > 000000 00000 
000000 A A 0000 
snd una =4 snd nxt =7 
000000 00000600 
u D D 0 
snd_max=7 
D00000- 
02417 QOOO0000 
IU DU ACKU 0 U U UU l 
snd una < [][][][] <= snd max 
24-17 OT | ACK[] | U 50 60 7 IO | 0 
snd una ACK[] | | | snd_unall | 
UU i 
























































648 anu no China+pub.com 
„nn EE 


tcp outputl] 0000 U 


snd_nxt < snd_max 


24-18 24-17 | 4[] 5 















































































































































































































































































































































| rev nxt[] rcv. wnd[] rcv. adv[] 











rcv. wnd- 6: 0000 

























































































































































































































































































































































































































































































(000000) 
1 2 3 4 5 6 7 8 9 10 11 
TCP D D D 0 0 — 
m Å 00000000 
rcv nxt =4 rcv adv = 10 
0000000 f pp4d00001 
02418 00000000 
| || 
rcv nxt <= UU H < rev nxt + rev wnd 
rcv nxt <- 000000 < rev nxt + rev wnd 
TCP ti seq[] TCP[] 
U 10 
24-19 TCP] HI O O 24-17 | l U U U D 0 U 40 SE 6 






























































































































































a 630 D IP[] D DI — 


























































































































































































































= [m] m TJ] 
200 0 8 20 12 III 
0 24-19 TCP OOO IPD 0 0 0 0 0 
IP 8 IP 12 TCP 12-20 
0 H U 0 U 
ip_hl 7 IP] D HPD 000000 32bit0 0 D (=28[] D ) 





ip_len 63 PP 00000000000 (02048 +20+12+3) 
8 TCPO O +TCPO D D D 0 0 D 32 bi 0 0 6320 D ) 
ti seq | 4 DH D DH HH DD H H H 
3 
6 





TCP 000000 ip len- (ip hlX 4)- (ti offx 4) 
O0000000000000 ti seq+ti len-l 

















D 24-20 D 24190 000000 
ti len TCP[] | 0 Ü | 































































































































































































24-20 0 IP 




















AN 








24-12) 






























































































































































24 TCP| 
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TCP 32 0-4 294 967 295 
TCP 2 4 294 967 295 0 
232 0 
0-4 294 967 295 
1 4 294 967 295 
tcp.h TCP unsigned long 
typedef u_long tcp_seg; 
24-21 4 
tcp seg h 
40 #define SEQ LT(a,b) ((int) ((a)-(b)) < 0) 
41 #define SEQ LEQ(a,b) ((int) ((a)-(b)) <= 0) 
42 #define SEQ GT(a,b) ((int) ((a)-(b)) > 0) 
43 #define SEQ GEQ(a,b) ((int) ((a)-(b)) >= 0) 
tcp seg.h 
[ 24-21 TCO H 000 
2. — 
TCP 3 bit[] 0-7 24-22 
8 ( 1 1 0 
1) 
H 24-22 3bi0 000 
0-x[] 1- x[] 2- x ( 
24-21 int) 1 0 
(SEQ LI" 0 0 0 (SEQ. GT[] ) 
24-22 ( “0-x”) 0 11 2l] 31] Ar 1) 
0 5[] ell 7( 0 0) 24-23 
5 6 7 [°] 1 2 3 4 
or p aut or p atu 
q— —nT 


D 24-23 3bit]) TCPOOOOO 


650 























China-pub.com 



































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































TCP/IP [O 2 
24-22 (1- x) ULUI 24-24 u 
6 7 0 [1] 3 4 5 
II00000 I B D O U 0 
q—— a 
D 24-24 3 bitg TCPH H H D D 
24-25 | | L L 
0 
7 i 1 
6 2 
5 3 
4 
0 24-25 [ 24-230 D 24-24 
TCP L 
TCP | 1 6 6 
5 5 1[] TCP 
21 30 4 ( 5 
24-26 24-25 TCP 32 bit 3 bit 
532 
D EEN 
4294967295 0 1 P 0 `. 
ya Ç 
š \ 
1 \ 
I 1 
i I 
\ l 
\ i 
A / 
` f 
d 
2147483649 2147 483 648 2147483648 ^ 
U 24-26 [00 000000 32 eid O 
24-26 32 bit Doo 2] 
24.8 tcp init[] |] 
domaininit TCP tcp init ([] 24-27) 




























































































ASS) tep iss] | 






















































































(quite time)" 




















































































































































































































IP 

































































7-23 








Chinaspubecom er 651 




















































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































43 void top subre 
44 tcp init() 
45 í 
46 tep iss = 1; /* wrong */ 
47 tcb.inp next = tcb.inp prev = &tcb; 
48 if (max_protohdr < sizeof(struct tcpiphdr)) 
49 max_protohdr = sizeof (struct tcpiphdr); 
50 if (max_linkhär + sizeof(struct tcpiphdr) > MHLEN) 
51 panic("tcp_init"); š 
= tcp_subr.c 
0 24-27 tcp init JO 
2. TCP Internet PCB 
PCB (tcb)[] previous next tcb PCB 
0( 0) 
PCB inp_lport TCP TCP 
1024 22.4 
3. 
40 max_protohdr 40( 
IP/TCP ) 7-17 max_linkhdr ( 
16)[] 40 mbu (100 2-7 MHLEN) 
MSL 
TCP TCP 
MSL(2 ) TCP TCP 
MSL (maximum segment lifetime) 
MSL 
CLOSE_WAIT 2[] MSL (U 24-15) 
RFC 793(Postel 1981c) MSL 2 Net/3 MSL| 301] ( 
25-3 TCPTV_MSL) 
(RFC 793 (wandering 
duplicate) Net/3 tcp_iss 1(U 24-27) 
25.5 tcp iss 128 000 9.3 
connect[] tcp. iss 64 000 
9.3 
1) 1024 2 



























































































































































































































































65 2 TCP/IP 
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2 
2) 2 
3) 
4) 
5) 40 TCP tcp iss[] I 
6) 
1024 SYN 1 
(incarnation) 
7) 1 u L | | 0 L 
L] E 
24-28 
DD 1-- 000000000000 000000) -------- ga 
2—+— 9090000022 000000000 | 
3+ 900000000000 | 
44 p000000 | 
| 
I 
40! [] | <MSL 
l 
| 
I 
5+ 9000000's9001 | 
6+ 00000000000000 | 
ZIONA esse y 
00 
D 2428 I000000000000000 
TCP ISS ISS 
ISS 
p000000 TCPO MSL 
( ) TCP 
MSL 
249 00 
6 TCP TCP 
TOR TCP |000000000 D 
U U | i 0 i TCP 
TCP TCP 
(TCP ) 32 bit 



































































































































































































































Chi f HIT 1000 653 


O000000000000000000000000000000 TCP 0000 


O 24 TCP[] 



























































000 TCPOOO tcp_initQ D D D Internet PCBO TCP I 00000 
OOO00000000000000 





































































































































































































OU 
24.1 002450 000000000 000000 0000000000 
24.2 tepinit DOO0000 
243 JO netstat -A0000 0 | 100000 TCPO | 






























































China=pubscom, 


0 250 TCPO OOO 






























































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































25.1 DD 
TCP TCP 
TCP 
1)" (connection establishment)” SYN 
75 
2)" (retransmission)” TCP 
TCP (] TCP ) 
TCP 
3)“ ACK(delayed ACK)” TCP 
TCP 200 ms 200 ms 
ACK 
4)“ (persist )” 0 TCP 
( ACK ) TCP 
TCP 
0 1 
5 60 
5)“ (keepalive)” SO_KEEPALIVE 
2 
TCP 2 
TCP TCP 
TCP 
( ) ( 
) 
6) FIN_WAIT 2 FIN WAIT 1 FIN WAIT 2 ( 24-15) 
( close shutdown 
TCP ) FIN WAIT 2 10 75 
FIN 
FIN WAIT 2 
7) TIME WAIT 2MSL| 2MSL MSL[] 24.8 
TIME WAIT 































































































































































































25 TCP 

































































655 






















































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































18.6 2MSL TIME_WAIT 
1 (Net/3 30 MSL) TCP Internet PCB 
TCP 200 ms ( ) 500 
ms ( ) ACK 6 
ACK 200 ms ACK (LACK 
0-200 ms ) 500 ms 0 
25.2 [] 00 
TCP[] [] TF_DELACK ([] 24-14) 
ACK TCP t_timer 4] (TCPT NTIMERS) 
6 25-1 6 
ACK 6 
[] U [] [] U 
TCPT_REXMT 0 U U D D 
TCPT_PERSIST| I DU U D D 
TCPT KEEP 2 O000000000000 
TCPT 2MSL 3 2MSL[] [] 0 FIN WAIT 20 0 O 
O 25-1 t timer 0000 
t timer | 500 ms 
16 383.5 4.5 
| go Do jooack} 00 | 00 | FIN | zwet 
000 (00 U D U 000 000 | WAIT 2 
t timer [TCPT REXMT] . 
t_timer [TCPT_PERSIST] . 
t_timer[TCPT_KEEP] . 
t_timer [TCPT_2MSL] 
t_flags & TF_DELACK 
tcp keepidle (20 0) 
tcp_keepintvl (75[] ) 
tcp maxidle (109 0) 
2 * TCPTV MSL (60[] ) 
TCPTV KEEP INIT (75[] ) ° 
[] 25-2 ID TCPOHOOUUO 
25-1 4[] " Ñ 6[] TCP" k 
TCPT_KEEP 
2MSL FIN WAIT 2 TCPT 2MSL 
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TCPTV_REXMTMAX 


OOO L L | 
UU 4 2 (O 25-3) 
2 O I TCP 
200 ms] [D oop [] o 
25-3 Net/3 
[] [] 
TCPTV. MSL [] 00000 
TCPTV. MIN 





TCPTV_PERSMIN 
TCPTV_PERSMAX 





TCPTV_KEEP_INIT 
TCPTV_KEEP_IDLE 
TCPTV_KEEPINTVL 


O000000 emm 
000000000 








TCPTV_SRTTBASE 
TCPTV_SRTTDFLT 














000000 RTTE l 
U D 0 U 
































3 
4 




















= 
C) 
O 
O 
E 


U 253 TOP] D 0 0 D L 























































































































TCP LINGERTIME 


TCP MAXRXTSHIFT 
TCPTV KEEPCNT 









































D SO_LINGER)OODODOD 0 00000 D 
D DUD ACKD D D DD 0 0 
D D 0000 DDD 0000 D 





















































































































































































































































































































































































































































































































































25-50 0 0 0 TCP T. RANGI OD ODO 
OOO 
- tcp_timer.h 
102 #define TCPT_RANGESET (tv, 
103 (tv) = (value); \ 
104 if ((tv) < (tvmin)) 
105 (tv) (tvmin); \ 
106 else if ((tv) 
107 (tv) (tvmax); 
108 ) 2 
tcp timer.h 
25-3 0 OM 
25-4 (linger timer) |] 
SO LINGER close (15.15 
30-12[] [] | | 
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25.3 tcp canceltimers||[| 































































































































































































































































































































































































25-6 tcp canceltimers TIME WAIT tcp input 
2MSL 4 
FIN. WAIT 2 
— BOD HHE C 
107 void TE 


108 tcp canceltimers (tp) 
109 struct tcpcb *tp; 





















































































































































































































































































































































































































































































































































































































































110 ( 

111 int i; 

112 for (i = 0; i « TCPT NTIMERS; i++) 

113 tp-»t timer[i] = 0; 

114 : 
på) ee aep timere 

U 25-6 tcp canceltimers [0 
25.4 tcp fasttimo[|[| 
25-7 tcp fasttimo 200 ms[] pr. fasttimo 
ACK 

A A q LCH timer o 

41 void ii 

42 tcp fasttimo() 

43 ( 

44 struct inpcb *inp; 

45 struct tcpcb *tp; 

46 int s = splnet (); 

47 inp = tcb.inp_next; 

48 if (inp) : 

49 for (; inp != &tcb; inp = inp-»inp next) 

50 if ((tp = (struct tcpcb +) inp-»inp ppcb) && 

51 (tp->t flags & TF DELACK)) ( 

52 tp->t flags &= "TF_DELACK; 

53 tp->t flags |- TF ACKNOW; 

54 tcpstat.tcps delack++; x i 

55 (void) tcp output (tp); 

56 3 

57 splx(s); 

58 å 
DE n EH timere 

[] 25-7 tcp fasttim JO 0 0O 200 ms] 000 
TCP TCP Internet PCB TCP_DELACK 
TF_ACKNOW tep_output TF_ACKNOW 
ACK 
TCP[] PCB Internet PCB TCP ([] 50 ) 
30-11 (PRU_ATTACH socket ) 
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Inertnet PCB TCP (U 1-13) 
tcp_fasttimo 
25.5 tcp slowtimo[|[| 
25-8 tcp slowtimo 500ms[] pr. slowtimo 
6 FIN. WAIT 2 
2MSL 
=== 
64 void ke 
65 tcp slowtimo() 
66 ( 
67 struct inpcb *ip, *ipnxt; 
68 struct tcpcb *tp; 
69 int S = splnet (); 
70 int i; 
71 tcp maxidle = TCPTV KEEPCNT * tcp keepintvl; 
72 få 
73 * Search through tcb's and update active timers. 
74 */ 
75 ip = tcb.inp_next; 
76 if (ip == 0) ( 
77 splx(s); 
78 return; 
79 } : 
80 for (; ip != &tcb; ip = ipnzt) ( 
81 ipnxt = ip->inp_next; 
82 tp = intotcpcb (ip); 
83 if (tp == 0) 
84 continue; 
85 for li = 0; i < TCPT_NTIMERS; i++) { 
86 if (tp-»t timer[i] && --tp->t_timer[i] == 0) L 
87 (void) tcp usrreq(tp-»t, inpcb-»inp. socket, 
88 PRU. SLOWTIMO, (struct mbuf *) O, 
89 (struct mbuf *) i, (struct mbuf *) 0); 
90 if (ipnxt-»inp prev != ip) 
91 goto tpgone; 
92 } 
93 } 
94 tp->t_idle++; 
95 if (tp-»t rtt) 
96 tp->t rtt++; 
97 tpgone: 
98 ; 
99 } 
100 tcp iss += TCP_ISSINCR / PR SLOWHZ; /* increment iss */ 
101 tcp now++; /* for timestamps */ 
102 splx(s); 
103 ) . 
A te timer.c 
[] 25-8 tcp slowtim JO D OG 500 ms] [0 Ü 
71 tcp_maxidle 10 TCP 
25-6 FIN_WAIT_2 













































































































































































































































































tcp_init ( 25.2) 
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1 TCP 
72-89 TCP TCP Internet PCB 
0 1 0 PRU_SLOWTIMO 
tcp_timers 
tcp_usrreg mbu mbuf 
tcp_slowtimo i 
i mbu 
2. TCP 
90-93 Internet PCB[] ipnxt 
PRU SLOWTIMO tcp_slowtimo TCP PCB 
PCB == 2MSL 
TCP c — tpgone 
PCB 
3 
94 tcp input t idle 
500ms t idle (1)TCP 
2 | (2) FIN WAIT 2 10 
75 TCP (3) tcp output 
4 RTT 
95-96 RTT[] tcp output t rtt 
1 500 ms tcp_slowtimo 
t_rtt t_rtt 
5. 
100 tcp iss[]tcp init 1 500 ms tcp iss 64 000: 128 000 
(TCP_ISSINCR) 2 (PR SLOWHZ) tcp iss 
8 1 
tcp iss 64 000 
RFC 793 4 250 000 Net/3 
6. RFC 1323 
101 tcp now 0 500 ms RFC 1323 
[Jacobson, Barden) Borman 1992][] 26.6 
75-79 (tcb.inp next ) tcp. iss 
tcp now UNIX 
TCP 
25.6 tcp timers[|[] 
tcp timers 4[] TCP 0 TCP[] PRU. SLOWTIMO 






















































































































































































(U 30-10) 





















































660 roman n: Chibaspuf tot 
—— nu] 


case PRU_SLOWTIMO: 
tp = tcp_timers(tp, (int)nam); 






















































































switch case 25-9 




















































































































tcp_timer.c 


120 struct tcpcb * 
121 tcp_timers (tp, timer) 
122 struct tcpcb *tp; 


123 int timer; 

124 { 

125 int rexmt; 
126 switch (timer) (I 











































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































256 } 
257 return (tp); 
258 ) ; 
tcp timer.c 
0 25-9 tcp timers [000000 
3 (SU TCP ) 25.11 
25.6.1 FIN WAIT 20 2MSL 
TCP[] TCP2 2MSL 
1) FIN WAIT 2 tcp input[] FIN WAIT 1 FIN WAIT 2 
( close shutdown 
TCP ) FIN WAIT 2 10 (tcp_maxidle) 
FIN WAIT 2 
2) 2MSL TCP TIME WAIT 2MSL 60 
25-10 2MSL case — 0 
tcp timer.c 
127 /* P- 
128 * 2 MSL timeout in shutdown went off. If we're closed but 
129 * still waiting for peer to close and connection has been idle 
130 * too long, or if 2MSL time is up from TIME_WAIT, delete connection 
131 * control block. Otherwise, check again in a bit. 
132 */ 
133 case TCPT 2MSL: 
134 if (tp-»t state !- TCPS TIME WAIT && 
135 tp->t idle «- tcp maxidle) 
136 tp->t timer[TCPT 2MSL] = tcp keepintvl; 
137 else 
138 tp = tcp. close(tp); 
139: break; I 
tcp_timer.c 
[] 25-10 tcp timers [I [N 2MSLO OOOO 
1. 2MSL 
127-139 25-10 TCPT 2MSL 







































































































































































































































































( 25.4) TIME WAIT 60 tcp close 
























































25 








TCP 










































































661 











































































































































































































































































































































































































































































































































































































































































































































































































25-11 | | | 2MSL 
| (2X ) | 
0-500 ms | 2X N- 1] 2x NJ O g 
1191 000 x 500ms[]  =59.5[ 

I — — "M 

ESCH Gees t 
: Don an DD O 500 ms prslowtimo () 

" DO 
| i i : U ia E () 

tcp usrreq(PRU SLOWTIMO) 
DO 
tcp_timers (TCPT_2MSL) 
DO 
tcp close() 
O 25-11 TIME WAIT[] [| [| 2MSL 00000000 
2. FIN WAIT 2 
127-139 TIME WAIT[] TCPT 2MSL FIN WAIT 2 
10 (tcp_maxidle) 
100 0 0 FIN WAIT 20000000 750 25-2000 000 0 
12000 0 1500 0 
08 > _—_—__——_ gj Il 
(00 0) (750) 


y 


OO FIN WAIT 20 0 
FIN WAIT 20 00000 
1200(tcp maxidle); 


' 


FIN WAIT 200000 
t_idle=1198; 


FIN WAIT 200000 


i 


FIN_WAIT_20 0000 
t_idle=1198+150; 
tcp_close() 























































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































t_idle=0 H 150 (tcp_keepintvl) 
0 25-12 FIN WAIT 200000000000 FIN WAIT 20 0 
ACK FIN WAIT 1 FIN WAIT 2 (U 24-15)|]] t idle 
OT FIN WAIT 2 O 1200(tcp_maxidle) 25-12 0 10 [| 
0-500 ms 1199 
25-8 t idle 
t idle 1198( 10 ) " ]198 
1200" FIN. WAIT 2 150 (tcp. keepintvl) 75 
t idle 1348 tcp close 
10 O 75 0 LU 100 U LU 
FIN WAIT 2 [] 10 | t idle 
75 
ACK FIN WAIT 1 FIN WAIT 2| 
10 ( t idle 0) 



































662 zen 0: China-pub.con 
TET san! 





























































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































FIN WAIT 2 10 
FIN WAIT 2 close 
FIN TCP| close 
TCP FIN WAIT 2 
25.6.2 
25-13 case 
=== LCH timer.c 
210 ja 
211 * Persistence timer into zero window. 
212 * Force a byte to be output, if possible. 
213 * 
214 case TCPT_PERSIST: 
215 tcpstat.tcps persisttimeo++; 
216 tcp setpersist (tp); 
217 tp->t force = 1; 
218 (void) tcp output (tp); 
219 tp->t_force = 0; 
20 breaks en fimerc 
0 25-13 top timers 2000000000 
210-220 o[] TCP 
tcp setpersist TCPT PERSIST 
t force tcp output 1 
25-14 | 1.50 ( 
22-1) 
psupuA. 36 A ja PH o 
0 51016 28 52 100 f 160 220 
025-14 OI0O000000000000000000 
60 TCP 60 | LU 
5 60 | 5 1.5 3 
2[] 25.9 
25.6.3 
TCP[] TCPT KEEP 
1) connect SYN SENT ( ) 
LISTEN SYN RCVD ( ) SYN 
750) (TCPTV KEEP INIT) 75 ESTABLISHED 
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(tcp_keepidle) t_idle TCP 
( 2 ) 
TCP 
TCP 2 
25-15 TCP[] TCPT KEEP case 
tcp_timer.c 
221 ZS cP- 
222 * Keep-alive timer went off; send something 
223 * or drop connection if idle for too long. 
224 */ 
225 case TCPT KEEP: 
226 tcpstat.tcps, keeptimeo-*; 
227 if (tp->t state « TCPS ESTABLISHED) 
228 goto dropit; /* connection establishment timer */ 
229 if (tp-»t inpcb-»inp socket->so options & SO KEEPALIVE && 
230 tp->t state <= TCPS CLOSE WAIT) { 
231 if (tp-»t idle >= tcp keepidle + tcp maxidle) 
232 goto dropit; 
233 /* 
234 * Send a packet designed to force a response 
235 * if the peer is up and reachable: 
236 * either an ACK if the connection is still alive, 
237 * or an RST if the peer has closed the connection 
238 * due to timeout or reboot. 
239 * Using sequence number tp->snd_una-1 
240 * causes the transmitted zero-length segment 
241 * to lie outside the receive window; 
242 * by the protocol spec, this requires the 
243 * correspondent TCP to respond. 
244 */ 
245 tcpstat .tcps_keepprobe++; 
246 tep_respond(tp, tp->t_template, (struct mbuf *) NULL, 
247 tp->rcv_nxt, tp->snd una - 1, 0); 
248 tp-»t timer [TCPT KEEP] = tcp_keepintvl; 
249 ) else 
250 tp->t timer [TCPT KEEP] = tcp keepidle; 
251 break; 
252 dropit: 
253 tcpstat.tcps keepdrops++; 
254 tp = tcp drop(tp, ETIMEDOUT); 
255 break; 2 
- tcp_timer.c 
U 25-15 tcp timer [][] LU U D DD UI LI LI I 
1. 75 
221-228 ESTABLISHED([] 24-16)|]] TCPT KEEP 
dropit tcp_drop ETIMEDOUT 
ETIMEDOUT — ICMP 
EHOSTUNREACH 
30-4 TCP SYN 
75 SYN 25-16 


























































































































































































































664 





TCP/IP 
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00 00 DO tcp_drop () 
SYN SYN SYN 
0 25-16 SYNTIDO00000000000000 
6 O (U 25-19) 24 48 25.7 
SYN 0 6 30 
LU 750 3 LU LU 
tcp_drop 
2. 2 
229-230 2 
SO_KEEPALIVE ESTABLISHED 
CLOSE_WAIT ( 24-15)[] TCP close( 
CLOSE_WAIT) 2 TCP 
3. 
231-232 u 2 (tcp_keepidle) 10 
(tcp. maxidle)[|l] TCP 9 
750 (tcp_keepintvl)[] TCP 
ACK TCP 
4. 
233-248 [] TCP Uu UUU top responda 0 0 
(tcp respond ) rcv nxt 
snd una -1 (O 24-17) 
ACK 
25-17 
— 200 75 75 75 75 75 75, 75 75 , 75 
4 («Bu 0 75 150 225 300 375 450 525 600 675 
geen (tr) (Ai) 
OO OO OO 00 00 ag 00 Od OO 
1 2 3 4 3 6 7 8 9 
tcp. drop() 
02517 HDDUDUDUDUDUDDDDDDUDUID 
0 75 9 600 675 ( 2 
11.25 ) TCPTV. KEEPCNT([] 25-4) 8 





















































































































































25 TCP 


















































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































9 
0 t idle([] 25-8) 
tcp input 3 
14400(tcp keepidle) t idle 3 
tcp slowtimo 14339[] t. idle 1 x 
2 1 0 tcp_timers 6 
t idle 143390 0 25-18 å 
tcp timers||t idle 9 
25-15 t idle 15600 
(tcp. keepidle+tcp maxidle) O 25-18 [][] tcp timers DO DD 
25-170 0 675 9 0000 tide 000 
5. 
249-250 CLOSE_WAIT 
2 (tcp_keepidle) 
tcp keepdrops(253[] ) TCPT KEEP 






























































































































































































































































25.7 I0000000 



































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































| ACK 200ms 75 
2 = = 
RTT RTT 
TCP 
ACK TCP 
( ACK ) 
| 
Net/3[] TCP (RTO) (nticks) 
RTT (srtt) RTT (rttvar) 
[Jacobson 1988b] RTT 
delta=nticks -srtt 
Srtt« srtt+gX delta 
rttvare rttvar+h(|delta| -rttvar) 
RTO=srtt+4X rttvar 
delta (nticks) RTT (srtt) g RTT 
1/81] h 1/4 RTO 
4 2 









































































































































































































































666 
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TCP/IP 4.2 
[Jacobson 1988b]| RTO | [| 2X rttvar| | [Jacobson 
1990d] 4X rttvar Net/1 
TCP uu TCP 
25-19 
tcpcbl] [] [] [] tcp newtcpcb | ] LH [] O 
UU 
t srtt xs 0 0000 ert) O00 srttX 8 
t_rttvar [|] x4 24 3 OOOO rstrOOOOOOOD rttvarX 4 
t_rxtcur Od 12 6 DD U U 000 aro 
t_rttmin Od 2 a OO0O0O0O000 
t rxtshift (T 0 tep_backoff[ 02000 (0000) 
025-19 11 DD UD DB 00000000 
tcp_backoff 25.9 tcp newtcpcb | 
U | t rxtshift shift 
TCP MAXRXTSHIFT 25-19 
TCP RTT RTT 
(t. rtt[] t rttvar)] C 0 | U 
(scaled) srtt[] rttvar 
t_srttl]t_rttvar TCP 
25-20 t_srtt t_rttvar 
8[] 4 
U U [] U U 
TCP RTT SCALE 8 OO0 t_srtt=srttx 8 
TCP_RTT_SHIFT 3 OO 0 t_srtt=srtt<<3 
TCP_RTTVAR_SCALE 4 O00 t_rttvar=rttvarx 4 
TCP_RTTVAR_SHIFT 2 OM D t_rttvar=rttvar<<2 

















0 25-20 RTTIUDUUDUDUDOD 


25.8 tcp newtcpcb[|[] 





























































































































































































































































































































































































































25-21 tcp newtcpcb TCP 
TCP[] PRU, ATTACH 30-2) Internet 
PCB inp 
TCP 
167-175 malloc bzero 
176 seg_next|| seg_prev | 
27.90 [] O g 
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tcp_subr.c 
167 struct tcpcb * 
168 tcp_newtcpcb (inp) 
169 struct inpcb *inp; 
170 { 
171 struct tcpcb *tp; 
172 tp = malloc (sizeof (ftp), M PCB, M NOWAIT); 
173 if (tp == NULL) 
174 return ((struct tcpcb +) 0); 
175 bzero( (char zi tp, sizeof (struct tcpcb)); 
176 tp->seg next = tp->seg_prev = (struct tcpiphdr *) tp; 
177 tp->t_maxseg = tcp mssdflt; s 
178 tp->t flags = tcp do rfc1323 ? (TF REQ SCALE | TF REO TSTMP) : 0; 
179 tp-»t inpcb = inp; 
180 /* 
181 * Init srtt to TCPTV SRTTBASE (0), so we can tell that we have no 
182 * rtt estimate. Set rttvar so that srtt « 2 * rttvar gives 
183 * reasonable initial retransmit time. 
184 */ 
185 tp->t_srtt = TCPTV_SRTTBASE; 
186 tp->t_rttvar = tcp rttdflt * PR SLOWHZ << 2; 
187 tp->t_rttmin = TCPTV MIN; : 
188 TCPT_RANGESET (tp->t_rxtcur, 
189 ((TCPTV_SRTTBASE >> 2) + (TCPTV SRTTDFLT << 2)) >> 1, 
190 TCPTV MIN, TCPTV REXMTMAX); 
191 tp->snd_cwnd = TCP MAXWIN << TCP. MAX WINSHIFT; 
192 tp-»snd ssthresh - TCP MAXWIN «« TCP MAX WINSHIFT; 
193 inp-»inp ip.ip ttl = ip defttl; 
194 inp->inp_ppcb = (caddr t) tp; 
195 return (tp); 
196 3 
tcp. subr.c 
U 25-21 tcp newtetd 000000000000 TCP[J 0 O 
177-179 t maxseq 512(tcp_mssdflt) 
MSS tcp_mss ( TCP MSS ) 
RFC 1313 ([] 24-3 
top do rfct313 D[] TF. REQ SCALE[] TF REQ TSTMP 
TCP t inpcb Internet PCB 
180-185 25-19 t srtt[]t. rttvar[] t. rttmin 
t rxtcur RTT O(TCPTV SRTTBASE) 
RTT RTT tcp xmit timer 
RTT 0 
186-187 RTT t rttvar 24[] 3t cp. rttdflt 24-3) 
2(PR SLOWHZ) 2 bit( 4) t rttvar rttvar|] 4 6 
3 RTO t rttmin 2 
188-190 t rxtcu RTO 2 
(TCPTV MIN) 128 (TCPTV REXMTMAX)[] TCPT RANGESET 
12 6 RTO 
C RTT 
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China-pub.tol 















































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































TCP/IP 2 
RTO 2 4 
RTO=srtt+2X rttvar 
2 4 4.3BSD Tahoe [Paxson 1994] 
t srtt=8X srtt 
t rttvar=4X rttvar 
t srt ' 
Roy trttvar q EE 
= === x —— = 
8 4 2 
25-21 TCPT_RANGESET — 6 
TCPTV SRTTDFLT[] A[] ( ) t rttvar 
191-192 (snd cwnd) (snd ssthresh) 1073 725 440 ( 
1 GUU) TCP | (O 1[] 21.6 
) TCP| (65535[] TCP MAXWIN) 2"[] 14 
(TCP MAX WINSHIFT) SYN 
tcp mss snd cwndl] 1 
193-194 Internet PCB IP TTL 64(ip defttl) PCB 
TCP 0 
t_rxtshift 0 
bzero | 
25.9 tcp setpersist[|[] 
tcp setpersist TCP 25-13 
TCP 
0 25-22 
493 void tcp. output.c 
494 tcp setpersist(tp) 
495 struct tcpcb *tp; 
496 I 
497 t = ((tp->t srtt >> 2) + tp-»t rttvar) >> 1; 
498 if (tp->t timer [TCPT REXMT]) 
499 panic("tcp output REXMT"); 
500 FE 
501 * Start/restart persistance timer. 
502 */ 
503 TCPT_RANGESET (tp->t_timer [TCPT_PERSIST], 
504 E > tcp backoff[tp-»t rxtshift], 
505 TCPTV PERSMIN, TCPTV PERSMAX); 
506 if (tp->t rxtshift « TCP MAXRXTSHIFT) 
507 tp->t rxtshift++; 
508 3 
tep output.c 





[] 25-22 top setpersist 


ODO0O0000000000000000 
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1. | 
493-499 |] | | | | 
U U U U U 0 
OOOOOOD 
2. RTO 
500-505 RTO t 
RTO=srtt+2X rttvar 
U U U U U U U U 
— +t_rttvar 
RTO = —À 
2 
t u 
3. Huit 
506-507 RTO 0 O RTO) tcp. backoff 
int tcp_backoff[ TCP_MAXRXTSHIFT + 1] = 








(1, 2j 























tcp. output] 


































































































tp->t rxtshift=0; 
tcp_setpersist (tp); 














































































































































































































| tcp_setpersist t_rxtshift= 0 tcp_backoff[0]=1 
t[] TCPT. RANGESET[] [| RTO[] 50 ~60| t_rxtshift 
1 12(TCP. MAXRXTSHIFT)[] tcp. backoff[12] | 

























































































25.10 tcp xmit timer[|[| 



































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































tcp xmit timer RTT 
RTT (srtt) (rttvar) 
rtt RTT nticks+1 ([] 25.7 ) 0 
RTT (tcp now) 
E O O 26.6 tcp. now[] 500ms[] [J ([] 25-8) 
00000 Cep now III ACK 
| 25-8 t rtt[] 500 
ms 25.5 | 1 ACK 
RTT 1( ) 
tcp_input|| [| [| tep xnit timer] || UU 
































if (ts_present) 


























tcp_xmit_timer (tp, tcp_now - ts_ecr + 1); 


oO 


lse if (tp->rtt && SEQ GT(ti->ti ack, tp->t_rtseq) ) 
tcp_xmit_timer (tp, tp->t_rtt); 

















































































































(ts_present)[] RTT O (tcp now) 
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(ts_ecr) 1[] RTT ( 1 ) 
ACK 
RTT TCP (t_rtt) RTT 
t_rtseg 
ACK ACK (ti ack) 
(t. rtseq)[] t. rtt RTT RTT 
RFC 1323 t rtt[] TCP RTT 
([] 25-8) Eu 0 
tcp_slowtimo 500ms t_rtt 1 t_rtt 
1 tcp_xmit_timer 1 
tcp_xmit_timer 
ACK TCP 1-1024 
(t_rtseq 1) ( ) 1025-2048 
ACK ti_ack 2049 1-2048 
RFC 1323 
(ts_ecr) RTT 
25-23 RTT 
TITO —Ó — GEGEN input.c 


1311 tcp xmit timer(tp, rtt) 
1312 struct tcpcb *tp; 
1313 short rtt; 


1314 ( 
1315 


1316 
1317 
1318 
1319 
1320 
1321 
1322 
1323 
1324 
1325 
1326 
1327 
1328 
1329 
1330 
1331 
1332 
1333 
1334 
1335 
1336 
1337 


Short delta; 


tcpstat .tcps_rttupdated++; 


if (tp-»t srtt != 0) 
/* 


{ 


* srtt is stored as fixed point with 3 bits after the 
i.e., scaled by 8). The following magic 


binary point ( 


* + + + X 


/ 


delta = rtt - 1 - 


tp->t_srtt = 


smoothed mean 


binary point ( 


+ GRE 


/ 
0 25-23 tcp xmit timer 


(tp->t srtt >> TOP RTT SHIFT); 
if ((tp->t_srtt += delta) <= 0) 


1; 


We accumulate a smoothed rtt variance (actually, a 


difference), then set the retransmit 


scaled by 4). The following is 


equivalent to rfc793 smoothing with an alpha of .75 
(rttvar = rttvar*3/4 + Ideltal / 4). This replaces 
rfc793's wired-in beta. 


is equivalent to the smoothing algorithm in rfc793 with 
an alpha of .875 (srtt = rtt/8 + srtt*7/8 in fixed 
point). Adjust rtt to origin 0. 


timer to smoothed rtt + 4 times the smoothed variance. 
rttvar is stored as fixed point with 2 bits after the 


OOOO000RTIOOOOOOOOORTIIDOD 
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1338 if (delta < 0) 
1339 delta = -delta; s 
1340 delta -- (tp-»t rttvar »» TCP RTTVAR SHIFT); 
1341 if ((tp-»t rttvar «- delta) «- 0) 
1342 tp-»t rttvar = 1; 
1343 ) else ( 
1344 /* 
1345 * No rtt measurement yet - use the unsmoothed rtt. 
1346 * Set the variance to half the rtt (so our first 
1347 * retransmit happens at 3*rtt). 
1348 */ 
1349 tp->t_srtt = rtt << TCP_RTT_SHIFT; 
1350 ` tp->t_rttvar = rtt << (TCP RTTVAR SHIFT - 1); 
1351 i É 
Be EEE EE s I tcp_input.c 
H 25-23 (0) 
1. RTT 
1310-1325 tcp_newtcpcb RTT (t. srtt)[] 0 
RTT delta[] RTT RTT 
t srtt 8 
1326-1327 [] O RTT] L N] 
srtt€- srit+gX delta 
g=1/8 









































8X srtt€- 8X srtt+ delta 


























t srttet srtt+delta 
1328-1342 RTT L | | 


rttvare rttvar+h(| delta|- rttvar) 
































































































































































































































































































































































































































































































































































































































h=1/4 t_rttvar=4X rttvar | 

t.rttvar 

t rttvar t rttvar |delta | - 

4 “a * 4 

t_rttvar 

t_rttvar<t_rttvar+ |delta | === 

C 

2 RTT 
1343-1350 RTT | [] RTT | L 
| rtt rtt O O RTT[] [| 1(nticks+ DP] [] 
delta rtt 1 


































































































srtt=nticks+1 














t srtt 


8 = nticks +1 


672 
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TCP/IP 2 









































t_srtt=(nticks+1)X 8 























































































































































































































































































































































































































































































































O | RTT | 
srtt 
rttvar = — 
2 
t rttvar _ nticks+1 
4 2 
t rttvar=(nticks+l)X 2 
RTO 3X srtt 
RTO=srtt+4X rttvar 
rttvar 
srtt 
OSA 
RTO=3X srtt 
25-24 tcp_xmit_timer 
tcp input.c 
1352 tp-»t rtt - 0; PT 
1353 tp->t rxtshift = 0; 
1354 /* 
1355 * the retransmit should happen at rtt + 4 * rttvar. 
1356 * Because of the way we do the smoothing, srtt and rttvar 
1357 * will each average +1/2 tick of bias. When we compute 
1358 * the retransmit timer, we want 1/2 tick of rounding and 
` 1359 * 1 extra tick because of +-1/2 tick uncertainty in the 
1360 * firing of the timer. The bias will give us exactly the 
1361 * 1.5 tick we need. But, because the bias is 
1362 * statistical, we have to test that we don't drop below 
1363 * the minimum feasible timer (which is 2 ticks). 
1364 */ : 
1365 TCPT_RANGESET (tp->t_rxtcur, TCP REXMTVAL(tp), 
1366 tp->t_rttmin, TCPTV REXMTMAX) ; 
1367 ZS 
1368 * We received an ack for a packet that wasn't retransmitted; 
1369 * it is probably safe to discard any error indications we've 
1370 * received recently. This isn't quite right, but close enough 
1371 * for now (a route might have failed after we sent a segment, 
1372 * and the return path might not be symmetrical). 
1373 */ 
1374 tp->t_softerror = 0; 
1375 } 





1352-1353 RIT (t_rtt) (t rxtshift) 0 


tcp input.c 
D 25-24 tcp mit tier 00000000 























































































































































































































29 














TCP 
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1354-1366 









































#define TCP REXMIVAL(tp) \ 
(((tp)->t_srtt >> TCP_RTT_SHIFT) + (tp)->t ttvar) 























RTO(t_rxtcur) | 

































































U U U U U 















































tcp_xmit_timer 


RTO=srtt+4X rttvar 











































































































srtt| | rttvar 




































































































































































































































































































































































RTO(t_rttmin 


tcp_xmit_timer 



































t srtt t rttvar Lt srtt 
RTO = +4 X — = +t_rttvar 
4 8 
RTO 
t_newtcpcb 2 ) 128 (TCPTV_REXMTMAX) 
3. 

1367-1374 | 

(t softerror) 








































































































































































































25.11 [I ÅD tcp_timers][] |] 









































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































tcp timers 25.6 case 
RTO 
25-25 tcp output 1.5 
LAN ( 1 21-1) 
24 48 64 64 64 64 64 64 | 64] | 

| 746.5 YA 94.5 158.5 222.5 286.5 350.5 414.5 478.5 542.5 
| © ~~~) (7) (8) (9) (10) (11) (12) (13) 
l PUE 
Bech? tcp drop() 
15, 3 6 120 ~~ 
015 45 10.5 22.5 

(0 Q (3) (€ t rxtshift[] U Ü 

[] 25-25 00O0000000000 
x UT 1.5[] 4.5 
t rxtshift 12 | O 542.50 ([] 9 )] TCP 
RFC 793 
TCP TCP 
5 
RFC 1122 TCP 
TCP “ ý TCP 
Net/3 TCP 
(12) RTT 
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TCP/IP 2 
25-26 case 
tcp_timer.c 
140 /* P- 
141 * Retransmission timer went off. Message has not 
142 * been acked within retransmit interval. Back off 
143 * to a longer retransmit interval and retransmit one segment. 
144 */ 1 
145 case TCPT_REXMT: 
146 if (++tp->t_rxtshift > TCP_MAXRXTSHIFT) { 
147 tp->t_rxtshift = TCP_MAXRXTSHIFT; 
148 tepstat.tcps_timeoutdrop++; 
149 tp = tep_drop(tp, tp->t_softerror ? 
150 tp->t_softerror : ETIMEDOUT) ; 
151 break; 
152 ) 
153 tepstat.tcps_rexmttimeo++; 
154 rexmt = TCP REXMTVAL(tp) * tcp_backoff [tp->t_rxtshift]; 
155 TCPT_RANGESET (tp->t_rxtcur, rexmt, 
156 tp->t_rttmin, TCPTV REXMTMAX); 
157 tp->t timer [TCPT REXMT] = tp->t_rxtcur; 
158 få 
159 * If losing, let the lower level know and try for 
160 * a better route. Also, if we backed off this far, 
161 * our srtt estimate is probably bogus.  Clobber it 
162 * go we'll take the next rtt measurement as our srtt; 
163 * move the current srtt into rttvar to keep the current 
164 * retransmit times until then. 
165 Wi 
166 if (tp->t_rxtshift > TCP_MAXRXTSHIFT / 4) { 
167 in losing(tp-»t inpcb); 
168 tp->t_rttvar += (tp->t_srtt >> TCP RTT SHIFT); 
169 tp-»t srtt = 0; 
170 } 
171 tp->snd_nxt = tp->snd_una; 
172 /* 
173 * If timing a segment in this window, stop the timer. 
174 */ 
175 tp-»t rtt = 0; š 
tcp timer.c 
D 25-26 tcp timers J[J0000000000000 
1. 
146 (t rxtshift) 12(TCP MAXRXTSHIFT) 
25-25 t rxtshift 
TCP 
ETIMEDOUT 
2: 
147-152 TCP 
TCP TCP SYN 
TCP ETIMEDOUT 
ICMP" " tcp notify t softerror 
TCP EHOSTUNREACH 














































































































































































































25 TCP 675 




































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































ETIMEDOUT TCP SYN RST 
ECONNRFUSED([] 28-18) 
3. RTO 
153-157 TCP_REXMTVAL RTO 
t_rxtshift 1 RTO TCP_REXMTVAL RTO 
t rxtcur — t timer [TCPT REXMT] — 
tcp input ([] 28-12 29-6) 
4. [] IP 
158-167 4 in losing ( ) 
tcp output ([] 25-27[] case ) 
25-25 22.5 
in losing 
5. RTT 
168-170 RTT (t_srtt) O(t_newtcpcb 
0) tcp_xmit_timer RTT RTT 
4 TCP RTT 
case TCP_REXMTVAL RTO t SEE 0 
([] 25-28 42.464 
) 
RTO 
RTO =- == +t_rttvar 
t_srtt OL] RTO (U 25-28 84.064 
217.84[] )[] case t srtt O[] t rttvar 
6. 
171 (snd nxt) (snd, una) 24-17 
snd nxt snd una snd nxt 
7. Karn 
172-175 RTT t. rtt OL] Karn 
ACK 
[Karn and Partridge 1987] 1[] 21.3 TCP 
t rtt RTT 29-6 
RFC 1323 Karn 
25. 11.1 
25-27 case 
TCP 
TCP 
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11] 20.6 21.6 
176-205 win ( snd_wnd 
snd_cwnd ) ( t_maxseg) 
2 
t_ssthresh( t maxseq) snd cwnd 
4.3BSD[] Net/1 
(win) 
206 ACK| t dupacks ( 29.4 0 
29 TCP 
208 tcp output 
"m T tep timer.c 
177 * Close the congestion window down to one segment 
178 * (we'll open it by one segment for each ack we get). 
179 * Since we probably have a window's worth of unacked 
180 * data accumulated, this "slow start" keeps us from 
181 * dumping all that data as back-to-back packets (which 
182 * might overwhelm an intermediate gateway). 
183 * 
184 * There are two phases to the opening: Initially we 
185 * open by one mss on each ack. This makes the window 
186 * size increase exponentially with time. If the 
187 * window is larger than the path can handle, this 
188 * exponential growth results in dropped packet (s) 
189 * almost immediately. To get more time between 
190 * drops but still "push" the network to take advantage 
191 * of improving conditions, we switch from exponential 
192 * to linear window opening at some threshhold size. 
193 * For a threshhold, we use half the current window 
194 * size, truncated to a multiple of the mss. 
195 * 
196 * (the minimum cwnd that will give us exponential 
197 * growth is 2 mss. We don't allow the threshhold 
198 * to go below this.) 
199 */ 
200 t a 
201 u int win = min(tp->snd wnd, tp->snd cwnd) / 2 / tp->t maxseg; 
202 if (win < 2) 
203 win = 2; 
204 tp->snd_cwnd = tp->t_maxseg; 
205 tp->snd_ssthresh = win * tp->t_maxseg; 
206 tp->t_dupacks = 0; | 
207 ) 
208 (void) tcp_output (tp); 
209 break; 





0 25-27 tcp timer J)J0000000000000 





tcp_timer.c 
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25.11.2 

TCP RTT[] 500 ms[] [] 

RTT | ( 814 
LAN[] RTT RTT 60ms RTT 
[Brakmo, O'Malley, and Peterson 1994] TCP RTT 
( 500 ms ) 

ACK RTT 

Net/3 (26.6[] ) RTT Net/3 

500 ms 
































25.12 IO RTT T 









































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































bsdi 
vangogh.cs.berkeley.edu 12288 
PPP | TCP | 
sock ( 1 C) -D SO DEBUG (27.10 > 
trpt (8) TCP 
25-28 MIN M-N- 1 
512 | “ ACK M” ACK[] M 
“ (ms)” RTT rte ( 
T tcp_xmit_timer RTT 
1 
tcp_newtcpcb t srtt[]t rttvar[]t rxtcur 0.0 
SYN 365 ms ACK| tcp xmit timer 
rtt 2 RTT (t. srtt-0) 25-23 else 
RTT 
1-512 1.259 ACK[] RTT 
| 1.260 513-1024 
1025-1526 2.206 
ACK RTT ACK 
(513) 
2.206 1537-2048 3.132 ACK 
RTT 
3.132 5 (t_rxtcur ) 
sun[] netb PPP 6.064 
25-26 RTT t rxtshift[] 0 1[] t rxtcur 10 ( 


































































































































































































678 us 0: China+pub.tom 
TE nn! 









































































































































) (and unaz3073)[] 5 































































































t rxtshift 





















































1.260 513:1025 on 
1261 1025:1537 












ack 1537 








946 3 16 4 6 


1537:2049 
2049:2561 
2.209 2561:3073 


3.132 ack 2049 off 926 3 16 3 5 
3.132 3073:3585 on 

3.133 3585:4097 

3.736 ack 2561 i 

3.736 | 4097:4609 


3.737 | 4609:5121 

























































































3.739 ack 3073 
3.739 5121:5633 
3.740 5633:6145 
6.064 3073:3585 off 16 3 1 
11.264 3073:3585 off 16 3 2 
21.664 3073:3585 off 16 3 3 
42.464 3073:3585 off - 0 5 4 
84.064 3073:3585 off 0 5 5 
150.624 3073:3585 off 0 5 6 
217.184 3073:3585 off 0 5 7 
217.944 ack 6145 
217.944 6145:6657 on 
217.945 6657:7169 ; 
218.834 ack 6657 off 890 3 24 6 9 
218.834 7169:7681 on 
218.836 7681:8193 
219.209 ack 7169 
219.209 8193:8705 
219.760 ack 7681 22 7 9 
219.760 8705:9217 
220.103 ack 8705 
220.103 9217:9729 





220.105 9729:10241 


220.106 | 10241:10753 i 
220.821 ack 9217 off 1061 
220.821 | 10753:11265 on 
221.310 ack 9729 
221.310 | 11265:11777 


221.312 ack 10241 
221.312 | 11777:12289 
221.674 
221.955 









22. 6 8 




























ack 10753 
ack 11265 

























[2528 DOOORTTO 000000 




















42.464 t_srtt t_rttvar 5 25-26 





































































































































































































t_rxtcur ( 160) 
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t_srtt 0 RTT (218.834[] ) 
RTT RTT 
| 0 RTT 
25.15 OU 
200 ms[] 500 ms tcp_fasttimo tcp_slowtimo 
| TCP i 
TCP 7 
° ACK 
* FIN WAIT 2 
* 2MSL 
ACK 6 TCP200 ms 
ACK 6 TCP 500 ms 
1 0 TCP 
DO! 4 
6 
0 TCP D RTT 
RTT (srtt) RTT (rttvar)|] | 
( ) U 
U U 
25.1 TCP ( 24-5 ACK ) 
25:2 tcp_slowtimo tcp_init tcp_maxidle 
25.3 tcp_slowtimo t_idle t_idle 
U U TCP | 
25.4 25-10 TCPT_2MSL 
25.5 25-12 FIN_WIN_2 75 ACK 
25.6 SO KEEPALIVE 1 
1 2 
25.7 tcp_rttdflt 
25.8 OOOO 25.60 Ú 




















































































































26.1 [Il 














tcp usrreg 





SYN PRU_SH 

















tcp output 


[| 26] TOP [| I 















































































































































P 














UTDOWN 















































PRU RCV 




















RU CONNECT 











































































































































































































PRU SENDOOB 














*tcp fasttimo 


*tcp timers 


*tcp timers 





















































ACK 











































































































































































































*tcp drop 
































*tcp disconnect 























FIN 











*tcp input 























ACK| 











*tcp input 



























































( ACK 


























































































































*tcp_input 
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tcp input 
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TCP 

































































tcp output 

















tcp output 


























































































































































































































































































































26.2 tcp output) [] 




















































































































































































































































































































































































































































































































































































































































































































tcp output 14 26-1 
1. ACK 
61 (snd_max) (snd_una) | 
ACK[] idle 24-17 idle[] 4-6 TCP 
2: 
62-68 TCP ACK 
| (t maxseg ) 
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(“ " RTT) 
RTT Net/3 
FEET: tcp output.c 
44 tcp output (tp) 
45 struct tcpcb *tp; 
46 ( 
47 struct socket *so = tp->t_inpcb->inp_socket; 
48 long len, win; 
49 int off, flags, error; 
50 struct mbuf *m; 
51 struct tcpiphdr *ti; 
52 u_char opt [MAX TCPOPTLEN] : 
53 unsigned optlen, hdrlen; 
54 int idle, sendalot; 
55 FE . 
56 * Determine length of data that should be transmitted 
57 * and flags that will be used. 
58 * If there are some data or critical controls (SYN, RST) 
59 * to send, then transmit; otherwise, investigate further. 
60 * f 
61 idle - (tp-»snd max -- tp-»snd una); 
62 if (idle && tp->t idle >= tp-»t rxtcur) 
63 /* 
64. * We have been idle for "a while" and no acks are 
65 * expected to clock out any data we send -- 
66 * slow start to get ack "clock" running again. 
67 *7 
68 tp->snd_cwnd = tp->t maxseg; 
69 again: 
70 sendalot - 0; /* set nonzero if more than one segment to output */ 





218 /* 

219 * No reason to send a segment, just return. 
220 */ 

221 return (0); 

222 send: 





489 if (sendalot) 



























































490 goto again; 
491 return (0); 
492 T 
tep output.c 
O 26-1 tcp output [100000 
3. 
69-70 send ip_output ip_output 





















































































































































682 










































































































































































China-pubecom 























































































































































































































































































































































































































































































































































































































































































































































































































































































































TCP/IP 2 
sendalot 1 ip_output 
26.3 000000000000 
tcp output 
PRU_RCVD 
TCP tcp output 
26-2 “ ” 
tcp_output.c 

71 off = tp->snd_nxt - tp->snd una; BED, 
72 win = min(tp->snd wnd, tp->snd_cwnd) ; 

73 flags = tcp_outflags[tp->t_statel; 

74 ZS 

75 * If in persist timeout with window of 0, send 1 byte. 

76 * Otherwise, if window is small but nonzero 

77 * and timer expired, we will send what we can 

78 * and go to transmit state: 

79 EL 

80 if (tp->t force) ( 

81 if (win == 0) { 

82 /* 

83 * If we still have some data to send, then 

84 * clear the FIN bit. Usually this would 

85 * happen below when it realizes that we 

86 * aren't sending all the data. However, 

87 * if we have exactly 1 byte of unsent data, 

88 * then it won't clear the FIN bit below, 

89 * and if we are in persist state, we wind 

90 * up sending the packet without recording 

91 * that we sent the FIN bit. 

92 * 

93 * We can't just blindly clear the FIN bit, 

94 * because if we don't have any more data 

95 *.to send then the probe will be the FIN 

96 * itself. 

97 */ 

98 if (off « so-»so snd.sb cc) 

99 flags &= "TH FIN; 
100 win - 1; 
101 ) else { 
102 tp->t timer[TCPT PERSIST] = 0; 
103 tp->t rxtshift = 0; 
104 ) 
105 ) 

tep output.c 
D 26-2 top output 000000000 
71-72 off 
snd una( ) 
win (snd wnd) (snd cwnd) 
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73 24-16 tcp_outflags flags 
TH_ACK|| TH FIN|| TH RST TH SYN 
TH PUSH|| TH URG 4 























































































































































































































































































































74-105 t force 










































































tcp output 











tp-»t force = 1; 
error = tcp output (tp); 
tp-»t force = 0; 

















































































































































































































































































































































































































































































































































































































































































































































































































TCP 
win 0 ( t_force ) 
FIN win 1 
win 
t_rxtshift 0 
26-3 tcp output 
- : tcp output.c 
106 len = min(so->so snd.sb cc, win) - off; 
107 if (len « 0) ( 
108 /* 
109 * If FIN has been sent but not acked, 
110 * but we haven't been called to retransmit, 
111 * len will be -1. Otherwise, window shrank 
112 * after we sent into it. If window shrank to 0, 
113 * cancel pending retransmit and pull snd nxt 
114 * back to (closed) window. We will enter persist 
115 * state below. If the window didn't close completely, 
116 * just wait for an ACK. 
117 */ 
118 len = 0; 
119 if (win == 0) ( 
120 tp->t_timer [TCPT_REXMT] = 0; 
121 tp->snd_nxt = tp->snd_una; 
122 } 
123 } 
124 if (len > tp->t_maxseg) { 
125 len = tp->t_maxseg; 
126 sendalot = 1; 
127 } 
128 if .(SEQ_LT(tp->snd_nxt + len, tp->snd_una + so->so_snd.sb_cc)) 
129 flags &= ^TH FIN; i 
130 win = sbspace (&so->so_rcv); 
tcp_output.c 
O 26-3 te output [D D UD U U D D D U 
1. 
106 len win( 
TCP 1 ) off off 
















































































































































































































































































684 
































China-pub.con 





























































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































TCP/IP [l-2 
107-117 [UU len U D | i U 
U u u L | | 6[] TCP 
0000 4050600000 TCP S SE 
i i i 0 
snd wnæ= 0000 
(000000) 
1 2 3 4 5 6 7 8 9 
O000000 
snd una = 4 snd_nxt 210 
0000000 0000000 
DO 
[] 26-4 0040000000000 
ACK | TÚ 1007 | U elut 
1 26-5 
snd_wnd=1 
> 
1 2 3 4 5 6 8 9 
(0000000 
snd una =7 snd_nxt = 10 
üuggaagan 0000000 
000 
0 26-5 00470000000000000 
26-2[] [| 26-3| | 
off = snd_nxt - snd una = 10 - 7 = 3 
len = min(so snd.sb cc, win) -off = min(3, -3=-2 
DU O 70 80 9 
RFC 793[] RFC 1122 | O 0 [] U 
o RFC 791 0 å [] 
len 0 L [ FIN ( 26.2) 
26-6 

































































China-pubutom «was 685 



































o00000 > N 
snd_una =10 snd nxt = 11 


00000 000000 














































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































I OOOO 
D 26 000 1900000000000000000 
26-6 26-4 7-9 snd_una 10 
FIN TCP FIN snd_nxt 1( 
FIN ) snd_nxt 11 FIN 10 [] 26-2 26-3 

off = snd_nxt - snd una = - 10 = 

win = 6 

len = min( so snd.sb cc, win ) - off = min(0, 6) - 1 = -1 

6 

(0) 

3. 
118-122 len| 0 | 0 ou 

0 snd_nxt snd_una 0 0 0 0 0 

O O TCP 

4. 
124-127 | len] 
sendalot 1 26-1 tcp output 
| 

5.0 O O FIN 
128-129 0 0 FIN ( flags 

O) 26-7 
so snd.sb cc=1025 (0000) 











1 2 ... 512 513 514 Soe 1024 1025 


(IE —_o ——— 
uu (000 
snd una=1 sd nxt =513 
0000000 U D D DDD D 


D D D 


0267 DOOFNgo0 0000000 
512 ( O O op TCP 
[] (512-1024 ) 1 (1025[] [] ) LU 
















































































































































































































































































































































































686 TCP/IP 2 Chinapub.tom 
— =E 



























































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































len=512( ) 26-3 C 
SEQ LT (1025, 026) 
FIN TCP 1025 
6. 
130 win TCP 
TCP 
( SWS 1[] 22.30 ) 
26-8 
tcp output.c 
131 /* Liao 
132 * Sender silly window avoidance. If connection is idle 
133 * and can send all data, a maximum segment, 
134 * at least a maximum default-sized segment do it, 
135 * or are forced, do it; otherwise don't bother. 
136 * If peer's buffer is tiny, then send 
137 * when window is at least half open. 
138 * If retransmitting (possibly after persist timer forced us 
139 * to send into a small window),. then must resend. 
140 */ 
141 if (len) ( i 
142 if (len == tp->t_maxseg) 
143 goto send; 
144 if ((idle || tp->t_flags & TF_NODELAY) && 
145 len + off >= so->so_snd.sb_cc) 
146 goto send; 
147 if (tp-»t force) 
148 goto send; 
149 if (len >= tp-»max sndwnd / 2) 
150 goto send; 
151 if (SEQ LT(tp->snd nxt, tp-»snd max)) 
152 goto send; 
153 H 
tcp output.c 
D 26-8 tp output OO0O000000000000 
7. 
142-143 
144-146 ACK(idlel JJ ) Nagle (TF. NODELAY[] [] ) 
TCP Nagle ( 1[] 19.4[] ) 
TCP 
TCP NODELAY (U Telnet[] Rlogin) 
if TCP Nagle 
147-148 TCP 
149-150 
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max sndwnd|] tcp input 
TCP 
151-152 snd max 
25-26 snd nxt snd una snd nxt 
snd max 
26-9 tcp output TCP 
tcp output.c 
154 /* HES 
155 * Compare available window to amount of window 
156 * known to peer (as advertised window less 
157 * next expected input). If the difference is at least two 
158 * max size segments, or at least 50% of the maximum possible 
159 * window, then want to send a window update to peer. 
160 if 
161 if (win > 0) { 
162 /* 
163 * "adv" is the amount we can increase the window, 
164 * taking into account that we are limited by 
165 * TCP MAXWIN << tp-»rcv. scale. 
166 */ 
167 long adv = min(win, (long) TCP_MAXWIN << tp->rcv scale) - 
168 (tp->rcv adv - tp-»rcv nxt); 
169 if (adv >= (long) (2 * tp-»t maxseg)) 
170 goto send; j 
171 if (2 * adv >= (long) so->so rcv.sb hiwat) 
172 goto send; 
173 } 
tcp_output.c 
D 26-9 tcp output [0000000000000000 
154-168 
min (win, (long) TCP MAXWIN << tp-»rcv scale) 
(win) TCP 
(tp->rev adv - tp->rcv_nxt) 
TCP adv 
tcp input rcv nxt|| tcp output 
rev adv( 26-32) 
24-18 40 50 6 26-10 
tcp_output 
adv 3 3 (| 10[] 11[] 12) 
169-170 
TCP u (ACK- 
every-other-segment)” ( ) 


























088 





TCP/IP 2 Chibasbub to 









































win=6000000 

























































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































4 5 6 7 8 9 10 1 12 13 14 
rev_nxt=7 rcv adv - 10 
00000000 O00000000 
0 26-10. DO00 4050 6000 241800000000 
171-172 
26-11 tcp_output TCP 
tcp_output.c 

174 /* RUP 

175 * Send if we owe peer an ACK. 

176 */ 

177 if (tp->t flags & TF_ACKNOW) 

178 goto send; 

179 if (flags & (TH SYN | TH RST)) 

180 goto send; 

181 if (SEQ GT(tp->snd up, tp-»snd una)) 

182 goto send; 

183 {* 

184 * If our state indicates that FIN should be sent 

185 * and we have not yet done so, or we’re retransmitting the FIN, 

186 * then we need to send. 

187 */ 

188 if (flags € TH_FIN && 

189 ((tp->t_flags € TF_SENTFIN) == 0 || tp->snd_nxt == tp->snd_una)) 

190 goto send; 

tcp_output.c 
U 26-11 tcp output [0000000000000 
174-178 TF ACKNOW ACK 
TF ACKNOW 200 ms ACK ( 

) | SYN | FIN 
179-180 flags SYN[] RST 
181-182 snd_up 

PRU_SENDOOB OT 30-9) 
183-190 flags FIN FIN FIN 
FIN TF_SENTFIN 
tcp_output 26-12 
191-217 (so_snd.sb_cc ) 
| L| 

218=221 tcp_output 
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tcp output.c 



































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































191 /* 

192 * TCP window updates are not reliable, rather a polling protocol 

193 * using 'persist' packets is used to ensure receipt of window 

194 * updates. The three 'states' for the output side are: 

195 * idle not doing retransmits or persists 

196 * persisting to move a small or zero window 

197 * (re) transmitting and thereby not persisting 

198 i 

199 * tp->t timer[TCPT PERSIST] 

200 * is set when we are in persist state. 

201 * tp->t force 

202 * is set when we are called to send a persist packet. 

203 * tp->t timer[TCPT REXMT] 

204 * is set when we are retransmitting 

205 * The output side is idle when both timers are zero. 

206 * 

207 * I£ send window is too small, there is data to transmit, and no 

208 * retransmit or persist is pending, then go to persist state. 

209 * If nothing happens soon, send when timer expires: 

210 * if window is nonzero, transmit what we can, 

211 * otherwise force out a byte. 

212 * 

213 if (so->so snd.sb cc && tp->t_timer[TCPT_REXMT] == 0 && 

214 tp->t_timer[TCPT_PERSIST] == 0) { 

215 tp->t_rxtshift = 0; 

216 tcp setpersist(tp); 

217 } 

218 /* 

219 * No reason to send a segment, just return. 

220 */ 

221 return (0); 

tcp output.c 
D 26-12 top output 000000000 
100 50 512 
TCP 26-8 
(144-146[] ) 100 
50 26-8 
( TCP ACK) 

Nagle t force 4096[] 50 

2048 50 ACK 

ACK 50 
Nagle 
26.12 
TCP[] “ i 1024 
4096 


















































































































































690 






































China-pubecom 









































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































TCP/IP [] 2 
LU | U SYN[] ACK i i | |[] 4096 26-13| 
rcv nxt|[| rcv adv U L 
gd AA e at 
EE ESTER 4 
| I 
AA NE EEE 4 
m =1 rcv adv = 4097 
000000 O00000000 
O 26-13 JI0OO0O0O000000 4096 
1-1024 | tcp. input[] JJ | Ml ACK[] [] | 
1024] | 0 ([] 28-13) | rcv. nxt[] | 26-14 | 
. 000000 =3072 
E SSE a 
NEEN å 
rev nxt = 1025 rcv. adv = 4097 
OOO00dg O00000000 
[l] 26-14 [J 26-1370 000000 1-1024 0000000 
JU 1024 30-60 
PRU_RCVD O 0 tcp output[] | | Ú 
| L tcp output[] rcv nxt[] rcv. adv O O 26- 
14 4096 
1024 26-9| 
adv = min(4096, 65535) - (4097 - 1025) 
= 1024 
TCP MAXWIN[][] 65535 | U DU | 0 0 | 
U 20430 0 Ul | ACK 200ms 
ACK 
TCP D 1025-2048[] tcp input | | 0 
ACK qu H I 1024 O | [] rev nxt 
26-15] 
000000 =3072 
AA COR 
1025 2048 i 


I 














rev_nxt = 2049 
0000000 





! 


rcv adv - 4097 
O00000000 


D 26-15 026-140 000000 1025-2048] 0000000 
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1024-2048 tcp. output[] rcv. nxt[] rcv. adv 
26-15 1024 4096 
26-9 
adv = min(4096, 65535) - (4097 - 2049) 
= 2048 
2049 
4096 2049-6145 
rcv adv 6145 
200ms 
ACK 
" [] o ACK{] [] [| ACK 
0 
26.4 TCPO O 
TCP] tcp_output 0 
26-16 Net/3 

000000 

100 
0000 kindi 

10 D 

ne [000000 

00 100 20 0 

kind=3 | len=3 
0000000 KEEN hos 

100 100 10 D 








0000 kind=8 | len=10 O000 U 0 00000 


100 100 400 f 400 


O 26-16 Net/30 00 TCO O 























1 kin (kind=0[] kind=1) 1 
3 len kind 














































































































































































































































































































69 2 TCP/IP 2 






















































































































































































China-pub.con 





















































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































kind len 
—— MSS — 
1) TCP ( ACK[] SYN) SYN 
tcp. do rfc1323 ( 1) Net/3 
tcp newtcpcb 
2) SYN[] | 28-20 29-2 
3) TCP SYN 
( ACK[] SYN) 26-23 
27.5 MSS Net/3 
kinds al] 5[] 6[] 7 ACK 
RFC 1072[Jacobson and Braden 1998] 26-16 
ACK RFC 
1323 TCP| T/TCP (RFC 1644[Braden 1994] 1[] 24.7 
) 3 kinds 110 120 13 
26.5 000000 
RFC 1323 TCP 16 bit (O 24- 
10) ( RTT ) (long 
fat pipe) 1 24.3 TCP 
26-16 0( ) 14 1 073 725 
440 (65535x 2") Net/3 32 bit 16 bit 
| SYN 
TCP snd_scale[] rcv. scale 
0 | 16 bit 
snd scale 32 bit (O 28-6) 
32 bit rcv scale TCP 
16 bit 
TCP SYN 
rcv scale 
26.6 00000 
ACK 



































































































































RFC 1323 













































































26 TCP 




















693 



























































ACK 




























































































RTT 
























































26-17 































































































last_ack_sent 


ts_val “ts_ecr 7 


ts_recent 


tcp now-ts ecr = RIT 


ts recent age 
























































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































0 26-17 DOO0O0O000000000 
tcp now 0 500 ms 1( 

25-8) TCP 3 

*ts recent ( = u 

) 
ts recent age tep_recent tcp_now 
“last ack sent (ti ack) ({] 26-32) 
ACK rev nxt 

tcp input ts vall| ts ecr 

ts val 

e ts ecr| 

4 0x0101080a RFC 1323 A 
1 NOP kind 8 len 
10 NOP 32 bit 32 
bit 26-17 12 
(Net/3 ) (Y 28-10) 
26-16 10 NOP 
( 28.4) 
ACK RTT tcp now[] ts_ecr 500ms 
Net/3 
TCP PAWS (protection against wrapped sequence 

number)[] 28.7 PAWS ts_recent_age 

tcp output tcp now 







































































































































































694 1m China-bub.co 
































































































































































































































































































































































































































































































































































































































































































































2 
ts_recent (U 26-24) 
UI RST 
26.6.1 O RFC 13230 0 
TCP ts recent[] 
L i | RFC 1323 
ti_seq <= last_ack_sent < ti_seq + ti_len 

















26-18] I CU Ú 









































if (ts present && SEQ_LEQ(ti->ti_seq, tp->last ack sent) && 
SEQ LT(tp->last ack sent, ti->ti seg + ti->ti_len)) { 
tp->ts recent age = tcp now; 
tp->ts recent = ts val: 





0 26-18 OO0O00O000000000000 
















































































































































































































































































































































































ts_present 
tcp input 28-11 28-35 
0 0 Ü 26-19 15 | LU 
3 ti len 3 


























































































































last ack sent 


0030| 3 4 5 0000 


0050] 5 6 7 Jong 


O 26-19 O00005000000000000 


4 1 28-11 




































































































































































SEO LEO 




















un 


EO LT 20 30 4 


































































































































































































SEO LEO SEQ LT 2 | 2 










































































26 




















TCP 














695 













































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































3 1 5 
SEQ LEO 
ts recent [Braden 1993] 
1) 26-19 1] 2 
last ack sent 1 ts recent ACK 4 
last ack sent A(rcv. nxt ) 26-19 
2) ACK 
3) 10 2[] 3 26-19 1 
26-18 SEQ LT ts recent 
4) TCP ACK 4 ts recent 
1 RTT ( ) 
ACK ACK 
RTT ACK 
26-18 0 
rs_recent ( 24 28.7 
PAWS ) ( 
ACK) 
26.6.2 
Net/3 26-18 [Braden 1993] 26-20 
if (ts present && TSTMP GEQ(ts val, tp->ts recent) && 
SEQ LEO(ti->ti seg, tp->last_ack_sent)) { 
0 2620 TODO ON 
(ts_val) 
(ts_recent) 26-19 5 
TSTMP_GEO 24-21 SEQ GEQ 32 bit 
26.6.3 | ACK 
ACK RTT 26-17[] TCP 
ts_recent RTT 
ACK 
26-20 26-18 ACK 
26-21 4[] 5 














































































































































































































696 TCP/IP D 2 China*pub.tom 
— n iii 


rcv_wnd=6[] 0000 


4 5 6 7 8 9 10 11 


t 


rev nxt 
last ack sent 


! 


ti seq 


O 26-21 O0004050000000000 












































[] ti seg | last ack sent[]ts recent rcv nxt 2 
ACK | O ACK || || 
































































































































































































































26-22] [| 




















rev wnd-6[] 0000 














last ack sent rcv nxt 


| 


ti_seq 


U 26-22 000607000000 


E 


000 














ts_recent 














ti seq[| || last ack sent[] 

























































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































TCP] [| 4-7[] ACK ACK 0 
U U OD O 405 0 i (Y 26-24)[] O 26-22 
ACK[] | rcv_nxt last_ack_sent 
26.7 000000.0 
tcp output == TCP 0 
IP] O 
26-23 | SYN | MSS[] | 
223-234 TCP opt optlen | ( 
E ) SYN[] 0 snd_nxt ut E (iss)[]l] | ut 
TCP PRU, CONNECT O O iss 0 tcp input 
TCP iss 0 iss tcp iss 
235 TF_NOOPT 00000 U U DD 0 D U 
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SYN MSS 
Net/1 tcp newtcpcb t_flags[] 0 “ 
"[] TF. NOOPT Net/1 
MSS 
tcp_output.c 
223 PA cp. ip 
224 * Before ESTABLISHED, force sending of initial options 
225 * unless TCP set not to do any options. 
226 * NOTE: we assume that the IP/TCP header plus TCP options 
227 * always fit ina single mbuf, leaving room for a maximum 
228 * link header, i.e. 
229 * max linkhdr + sizeof (struct tcpiphdr) + optlen <= MHLEN 
230 */ 
231 optlen = 0; 
232 hdrlen = sizeof (struct tcpiphdr); 
233 if (flags € TH_SYN) { 
234 tp->snd_nxt = tp->iss; 
235 if ((tp->t flags & TF NOOPT) == 0) { 
236 u short mss; 
237 opt [0] = TCPOPT MAXSEG; 
238 opt [1] = 4; 
239 mss = htons((u short) tcp mss(tp, 0)); 
240 bcopy((caddr t) & mss, (caddr t) (opt + 2), sizeof(mss)); 
241 optlen - 4; 
242 if ((tp->t flags & TF REQ SCALE) && 
243 ((flags & TH ACK) -- { | 
244 (tp->t flags & TF_RCVD_SCALE))) { 
245 *((u_long *) (opt + optlen)) = htonl(TCPOPT_NOP << 24 | 
246 TCPOPT_WINDOW << 16 | 
247 TCPOLEN_WINDOW << 8 | 
248 tp->request_r_scale); 
249 optlen += 4; 
250 } 
251 } 
252 } 
tcp_output.c 
D 26-23 tcp output OOOOOO0O0syNooggo 
1. MSS 
236-241 opt[0] 2(TCPOPT MAXSEGJ[] opt [1] 4 MSS 
tcp mss MSS 27.5 bcopyl] 16 bit MSS 
opt 1210 opt 1310 ( 26.5) Net/3 SYN MSS 
2. 
242—244 TCP (TH ACK ) 
SYN 25-21[] TCP 
Eep-do.rfcl323 ( ) t flags 
TF REQ SCALE | TF REQ TSTMP 














3. 






































245-249 

































































3 (U 26-16) 1 NOP 























































































































698 





China-pub.con 



























































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































TCP/IP 2 
4 4 PRU_CONNECT 
request_r_scale tcp_input SYN 
RFC 1323 TCP 0 
TCP 
0 
26-24 tcp_output 
tcp_output.c 
253 £* Riant 
254 * Send a timestamp and echo-reply if this is a SYN and our side 
255 * wants to use timestamps (TF_REO_TSTMP is set) or both our side 
256 * and our peer have sent timestamps in our SYN’s. 
257 * 
258 if ((tp->t flags & (TF_REQ_TSTMP | TF_NOOPT)) == TF REQ TSTMP && 
259 (flags & TH RST) == 0 && š 
260 ((flags & (TH_SYN | TH_ACK)) == TH_SYN || 
261 (tp->t_flags & TF RCVD TSTMP))) ( 
262 u long *lp = (u_long *) (opt + optlen); 
263 /* Form timestamp option as shown in appendix A of RFC 1323. */ 
264 *]p++ = htonl(TCPOPT TSTAMP HDR); 
265 *lp++ = htonl(tcp now); 
266 *lp = htonl(tp->ts recent); 
267 optlen += TCPOLEN TSTAMP APPA; 
268 } 
269 hdrlen += optlen; 
270 [> 
271 * Adjust data length if insertion of options will 
272 * bump the packet length beyond the t_maxseg length. 
273 Er 
274 if (len > tp->t maxseg - optlen) { 
275 len = tp->t_maxseg - optlen; 
276 sendalot = 1; 
277 } 
tcp output.c 
U 26-24 tcp output 0 DO DD 00 0 U D 0 
4. 
253-261 3 (1)TCP 
(2) RST (3) (flags[] SYN ACK 
) TCP (TF RCVS TSTMP) MSS 
5. 
263-267 (26.6[] ) 12 (TCPOLEN TSTAMP APPA) 4 
0x0101080a( TCPOPT_TSTAMP_HDR) 26-17 tcp. now( 
500ms ) tcp input ts recent 
6. 
270-277 TCP optlen (len) 
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MSS (optlen) sendalot 
([] 26-1) 
MSS SYN Net/3[] [] SYN 
MSS MSS 
12 
26-25 tcp output IP[] TCP 
mbuf (len 0) 
Tr m tcp_output.c 
279 * Grab a header mbuf, attaching a copy of data to 
280 * be transmitted, and initialize the header from 
281 * the template for sends on this connection. 
282 */ 
283 if (len) { 
284 if (tp->t force && len == 1) 
285 tcpstat.tcps_sndprobe++; 
286 else if (SEQ_LT(tp->snd_nxt, tp->snd_max)) { 
287 tcpstat .tcps_sndrexmitpack++; 
288 tcpstat.tcps_sndrexmitbyte += len; 
289 } else { 
290 tcpstat.tcps_sndpack++; 
291 tcpstat.tcps sndbyte += len; 
292 ) 
293 MGETHDR (m, M DONTWAIT, MT HEADER); 
294 if (m -- NULL) ( 
295 error - ENOBUFS; 
296 goto out; 
297 } 
298 m->m data += max linkhdr; 
299 m->m len = hdrlen; 
300 if (len <= MHLEN - hdrlen - max linkhdr) { 
301 m copydata(so->so snd.sb mb, off, (int) len, 
302 mtod(m, caddr t) + hdrlen): 
303 m->m len += len; 
304 ) else { 
305 m->m_next = m_copy (so->so_snd.sb_mb, off, (int) len); 
306 if (m->m_next == 0) 
307 len = 0; 
308 } 
309 /* 
310 * If we're sending everything we've got, set PUSH. 
311 * (This will keep happy those implementations that 
312 * give data to the user only when a buffer fills or 
313 * a PUSH comes in.) 
314 */ 
315 if (off + len == so->so.snd.sb cc) 
316 flags |= TH PUSH; 


U 26-25 tcp output IJ000000000 PO te 0 00 Ü mbuf 






































284-292 










































































































































































t_force 1 


























snd nxt 






























































































































































snd max 








700 TCP/IP 























, China«bubcoM 

































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































8 IP[] TCP mbuf 
293-297 MGETHDR mbu mbuf IP[] TCP 
( ) tcp output ( write) 
tcp input 
M DONTWAIT “ out” 26-32 
9. [] mbu 
298-308 44 (100-40-16 TCP ) m_copydata 
mbu m_copy mbuf 
mbuf 2.9 
m copy m copy 
10. PSH 
309-316 TCP PSH 
PSH 
tcp input Net/3 PSH 
26-26 tcp output len 0 else 
TCP 
tcp output.c 
317 ) else ( /* len == 0 */ pr 
318 if (tp->t flags & TF ACKNOW) 
319 tcpstat.tcps_sndacks++; 
320 else if (flags & (TH_SYN | TH_FIN | TH_RST)) 
321 tcpstat.tcps sndctrl++; 
322 else if (SEQ GT(tp->snd up, tp->snd una) ) 
323 tcpstat.tcps sndurg++; 3 
324 else 
325 tcpstat.tcps sndwinup-*; 
326 MGETHDR(m, M DONTWAIT, MT HEADER); 
327 if (m == NULL) ( 
328 error = ENOBUFS; 
329 goto out; 
330 } 
331 m->m data += max_linkhär; 
332 m->m len = härlen; 
333 ) 
334 m-»m pkthdr.rcvif = (struct ifnet *) 0; 
335 ti = mtod(m, struct tcpiphdr *); 
336 if (tp->t template == 0) 
337 panic("tcp output"); 
338 bcopy ((caddr t) tp->t template, (caddr_t) ti, sizeof(struct tcpiphdr)); 
tcp output.c 
D 26-26 tcp output 0000000000 PO TCP] U O mbuf 
11. 
318-325 TF ACKNOW 0 ACK 
SYN[] FIN[] RST end qna 
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12. IP[] TCP mbuf 
326-335 mbu IP[] TCP 
13. [] mbu IP[] TCP 
336-338 Lbcopyll IPL] TCP t template mbuf 
tcp template 
26-27 tcp output TCP 
tcp_output.c 
339 /* cp_outp 
340 * Fill in fields, remembering maximum advertised 
341 * window for use in delaying messages about window sizes. 
342 * If resending a FIN, be sure not to use a new sequence number. 
343 */ : 
344 if (flags & TH FIN && tp->t_flags & TF_SENTFIN && 
345 tp->snd_nxt == tp-»snd max) 
346 tp->snd_nxt--; 
347 /* 
348 * If we are doing retransmissions, then snd nxt will 
349 * not reflect the first unsent octet. For ACK only 
350 * packets, we do not want the sequence number of the 
351 * retransmitted packet, we want the sequence number 
352 * of the next unsent octet. So, if there is no data 
353 * (and no SYN or FIN), use snd max instead of snd nxt 
354 * when filling in ti, seg. But if we are in persist 
355 * state, snd max might reflect one byte beyond the 
356 * right edge of the window, so use snd nxt in that 
357 * case, since we know we aren't doing a retransmission. 
358 * (retransmit and persist are mutually exclusive...) 
359 */ 
360 if (len || (flags & (TH SYN | TH FIN)) || tp->t timer[TCPT PERSIST]) 
361 ti-»ti seq = htonl(tp-»snd nxt); 
362 else 
363 ti-»ti seq = htonl(tp->snd max); 
364 ti->ti ack = htonl(tp-»rcv nxt); 
365 if (optlen) { 
366 bcopy ((caddr_t) opt, (caddr_t) (ti + 1), optlen); 
367 ti->ti off = (sizeof (struct tcphdr) + optlen) >> 2; 
368 } 
369 ti->ti_flags = flags; 
tep output.c 
[] 26-27 tcp output JO [ O [] ti seq [| ti ack [| ti flags 
14. FIN snd nxt 
339-346 TCP FIN 26-28 TH FIN 
TF SENTFIN snd nxt snd max FIN 
(O 26-31) FIN snd nxt 1( O FIN ) 
snd_nxt 
15. 
347-363 snd_nxt snd_max 





































































































































































































(1) (Jen OLU (2) SYN FIN (3) 





























































































































702 TCP/IP 



































































































































































































































China-pubecom 




















































































































































































































































































































































































































































































































2 
1 2 3 4 5 6 7 8 9 FIN 
o00000 ` 
snd, una = 10 snd nxt = 11 
snd max = 11 
U 26-28 FIND JI I D HBD B 0 
16. 
364 rcv_nxt 
17. 
365-368 TCP (optlen 0) TCP TCP 
bit (O 24-10[] th off) TCP (20 ) 
4 32 bit TCP 
369 TCP flags 
26-29 TCP TCP 
tcp_output.c 
370 £* nd 
371 * Calculate receive window. Don't shrink window, 
372 * but avoid silly window syndrome. 
373 */ 
374 if (win < (long) (so-»so rcv.sb hiwat / 4) && win < (long) tp->t maxseg) 
375 win = 0; 
376 if (win > (long) TCP MAXWIN << tp->rcv scale) 
377 win = (long) TCP MAXWIN << tp->rcv scale; 
378 if (win < (long) (tp-»rcv adv - tp->rcv_nxt)) 
379 win = (long) (tp->rcv adv - tp->rcv_nxt); 
380 ti->ti win = htons((u short) (win >> tp-»rcv scale)); 
381 if (SEQ GT(tp->snd up, tp->snd_nxt)) ( 
382 ti->ti urp = htons((u short) (tp->snd up - tp-»snd nxt)); 
383 ti->ti flags |= TH URG; 
384 ) else 
385 /* 
386 * If no urgent pointer to send, then we pull 
387 * the urgent pointer to the left edge of the send window 
388 * so that it doesn’t drift into the send window on sequence 
389 * number wraparound. 
390 */ 
391 tp->snd_up = tp->snd_una; /* drag it along */ 
392 £* 
393 * Put TCP length in extended header, and then 
394 * checksum extended header and data. 
395 */ 
396 if (len + optlen) 
397 ti->ti len = htons((u short) (sizeof(struct tcphdr) + 
398 optlen + len)); 
399 ti->ti_sum = in_cksumím, (int) (hdrlen + len)); 
tcp. output.c 


U 26-29 tcp output U D 0 U 0 TCP 0 0 0 0 0 0 D 0 D 














18. 
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26 TCP 
370-375 (ti_win) 
26-3 win win 
l/A(so rcv.sb hiwat) 0 
1/4 
19. 
376-377 win 
20. 
378-379 26-10 rcv adv rcv nxt 
win 
( win 0) 
1 22-3 
21. 
381-383 (snd_up) snd_nxt TCP TCP| 
16 bit URG 
TCP 
URG 
26-30 
send(fd, buf, 3, MSG OOB); 
send Berkeley 
24-10 32 bit (snd up) 
TCP 16 bit (ti urp) 
65535 
| snd nxt 
65535 16 bit 65535 
16 bit 26.6 
384-391 | TCP (snd_una) 
392-399 TCP TCP STE 
TCP so snd.sb cc =3 
t template IP[] TCP ([] 26-26) P Ë š 
IP ( 23-19 
UDP ) 4 
26-31 tcp output SYN snd_una snd_up=7 
FIN PS [| PRU_SENDOOB] [] 
22. 0000000 =3 
400-405 TCP H tcp. output] D 
startseq 26-31 


















































































































































D2e30 1000000200 
O000000 












































704 an 0: China+pub.com 
EE HE 
















































































































































































































































































































































































400 7* tcp output.c 
401 * In transmit state, time the transmission and arrange for 
402 * the retransmit. In persist state, just set snd max. 
403 */ 
404 if (tp-»t force == || tp->t timer[TCPT PERSIST] == 0) { 
405 tcp seg startseg = tp->snd nxt; 
406 ya 
407 * Advance snd_nxt over sequence space of this segment. 
408 */ 
409 if (flags & (TH SYN | TH FIN)) { 
410 if (flags & TH SYN) 
411 tp->snd_nxt++; 
412 if (flags & TH_FIN) { 
413 tp->snd nxt++; 
414 tp->t flags |= TF SENTFIN; 
415 ) 
416 ) 
417 tp->snd nxt += len; 
418 if (SEQ GT(tp-»snd nxt, tp->snd max)) { 
419 tp->snd max = tp->snd nxt; 
420 Z8 
421 * Time this transmission if not a retransmission and 
422 * not currently timing anything. 
423 */ 
424 if (tp-»t rtt -- 0) ( 
425 tp-»t rtt = 1; 
426 tp->t rtseq = startseq; 
427 tcpstat.tcps_segstimed++; 
428 } 
429 } 
430 /* 
431 * Set retransmit timer if not currently set, 
432 * and not doing an ack or a keepalive probe. 
433 * Initial value for retransmit timer is smoothed 
434 * round-trip time + 2 * round-trip time variance. 
435 * Initialize counter which is used for backoff 
436 * of retransmit time. 
437 */ 
438 if (tp->t_timer[TCPT_REXMT] == 0 && 
439 tp->snd_nxt != tp->snd una) { 
440 tp->t_timer [TCPT_REXMT] = tp->t_rxtcur; 
441 if (tp->t_timer[TCPT_PERSIST]) { 
442 tp->t timer[TCPT PERSIST] = 0; 
443 tp->t_rxtshift = 0; 
444 } 
445 } 
446 } else if (SEQ GT(tp->snd nxt + len, tp->snd_max)) 
447 tp->snd max = tp->snd nxt + len; 
tep output.c 
U 26-31 tee output [J0000000000000 
23. snd nxt 
406-417 SYN[] FIN snd nxt FIN 
TF SENTFIN snd nxt (len) 0 
24. snd max 
418-419 snd nxt snd max snd max 












































































































































China pubscon «us 705 


420-428 RTT[] (t_rtt=0) (t_rtt=]) 
| t_rtseql| [|| tcp. input ACK 
RTT 25.10 | 


if (tp->t_rtt && SEQ GT(ti->ti ack, tp->t_rtseg)) 
tcp_xmit_timer (tp, tp->t rtt); 



















































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































25. 
430-440 
t rxtcur RTT tcp xmit timer t rxtcur 
snd nxt snd una( snd nxt len) ACK 
441-444 
26. 
446-447 t_force ( 26-31 
if else ) snd max len 1 
tcp output 26-32 
ip output 
tcp output.c 
448 ya Ber 
449 * Trace. 
450 +) 
451 if (so->so_options & SO_DEBUG) 
452 tcp trace(TA OUTPUT, tp->t state, tp, ti, 0); 
453 /* 
454 * Fill in IP length and desired time to live and 
455 * send to IP level. There should be a better way 
456 * to handle ttl and tos; we could keep them in 
457 * the template, but need a way to checksum without them. 
458 #7, 
459 m-»m pkthdr.len = härlen + len; 
460 ((struct ip *) ti)->ip len = m->m_pkthär.len; 
461 ((struct ip *) ti)-»ip ttl = tp-»t inpcb-»inp ip.ip ttl; /* XXX */ 
462 ((struct ip *) ti)-»ip tos = tp-»t inpcb-»inp ip.ip tos; /* XXX */ 
463 error = ip output(m, tp->t inpcb-»inp options, &tp-»t inpcb-»inp route, 
464 So-»so options & SO DONTROUTE, 0); 
465 if (error) ( 
466 out: 
467 if (error == ENOBUFS) { 
468 tcp quench(tp-»t inpcb, 0); 
469 return (0); 
470 } 
471 if ((error == EHOSTUNREACH || error == ENETDOWN) 
472 && TCPS_HAVERCVDSYN (tp->t_state)) ( 
473 tp->t_softerror = error; 
474 return (0); 
475 } 
476 return (error); 
477 } 


[] 26-32 tcp output. JO O T] pop 00000 


706 
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478 tepstat.tcps_sndtotal++; 
479 LE 
480 * Data sent (as far as we can tell). 
481 * If this advertises a larger window than any other segment, 
482 * then remember the size of the advertised window. 
483 * Any pending ACK has now been sent. 
484 * 
485 if (win > 0 && SEQ GT(tp-»rcv nxt + win, tp-»rcv adv)) 
486 tp-»rcv adv = tp-»rcv nxt + win; 
487 tp->last ack sent = tp->rcv nxt; 
488 tp->t flags &= ^(TF ACKNOW | TF DELACK); 
489 if (sendalot) 
490 goto again; 
491 return (0); 
492 ) 
tcp output.c 
[] 26-32 (O) 
27: 
448-452 SO_DEBUG tcp_trace TCP 
27.10 
28. IP TTL[] TOS 
453-462 IP 3 IP TTL[] TOS 23-19 
3 
" XXX" TTL[] TOS 
| TCP 
IP 
29. [] IP 
463-464 ip output TCP TCP SO DONTROUTE 
IP SO DONTROUTE ip output 
SO BROADCAST SO DONTROUTE 
connect SO BROADCAST 
467-470 IP[] mbuf ENOBUFS 
tcp_quench 
TCP 0(OK) 
udp output([] 23-20) TCP ( 
) mbu TCP 
ACK ACK 
471-475 SYN 
tcp. output[] tcp. usrreq ( 30 
PRU CONNECT!|| PRU SEND|| PRU SENDOOB|| PRU SHUTDOWN ) 
tcp. output tcp output tcp input 
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30. rcv adv[] last ack sent 
479—486 (rev nxt win) rcv adv 
26-9 rcv adv 26-29 
TCP 
487 | L | last ack sent tcp input IUU 
(0 26-6) 
488 ACK| TF ACKNOW|| TF DELACK 
31. 
489—490 sendalot again[] (U 26-1) 
([] 26-3) TCP 
26.8 tcp templatel[|[] 
tcp. newtcpcb( JU TCP 
( PRU_CONNECT 
SYN)[] tcp. template IP[] TCP 
tcp output 
26-33 tcp template 
: tcp subr.c 
59 struct tcpiphdr * 
60 tcp template (tp) 
61 struct tcpcb *tp; 
62 ( 
63 struct inpcb *inp = tp->t inpcb; 
64 struct mbuf *m; 
65 struct tcpiphdr *n; 
66 if ((n = tp-»t template) == 0) ( 
67 m = m get (M DONTWAIT, MT HEADER); 
68 if (m == NULL) 
69 return (0); 
70 m-»m len = sizeof(struct tcpiphdr); 
71 n = mtod(m, struct tcpiphdr *); 
72 } 
73 n->ti_next = n->ti prev = 0: 
74 n->ti x1 = 0; 
75 n->ti pr = IPPROTO TCP; 
76 n->ti len = htons (sizeof (struct tcpiphdr) - sizeof(struct ip)); 
77 n->ti_src = inp->inp laddr; 
78 n->ti dst = inp->inp faddr; 
79 n->ti sport = inp->inp_lport; 
80 n->ti_dport = inp->inp fport; 
81 n->ti seg = 0; 
82 n->ti_ack = 0; 
83 n->ti_x2 = 0; 
84 n->ti off = 5; /* 5 32-bit words = 20 bytes */ 
85 n->ti flags = 0; 
86 n->ti win = 0; 
87 n->ti sum = 0; 
88 n->ti_urp = 0; 
89 return (n); 
90 T 
tcp_subr.c 


[] 26-33 tcp template [0000 IPITCPODDDO 
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TCP/IP 2 

1. mbuf 
59-72 IP[] TCP mbu mbu TCP 
t_template 0 tcp inputi 
M DONTWAIT 

2. 
73-88 IP[] TCP O[] ti pr TCP[] IP (6) 
ti len 20[] TCP ti off 5[] TCP 32 bit 

Internet PCB IP IP TCP TCP U 

3. [] O TCP JOD | 
73-88 IP[] TCP | TCP 
23.6 UDP 23-19 udpiphdr 

tcp template||ti next||ti prev 0 
26.9 tcp. respond[| |] 
tcp. respond ip. output IP 
1)tcp input RST ACK 
2)tcp timers 
TCP tcp respond tcp output 
tcp. drop O O tep. output] O [| RST 
RST tcp respond 
26-34 tcp respond 
tcp. subr.c 

104 void iz 

105 tcp_respond(tp, ti, m, ack, seq, flags) 

106 struct tcpcb *tp; 

107 struct tcpiphdr *ti; 

108 struct mbuf *m; 

109 tcp seq ack, seq; 

110 int flags; 

111 ( 

112 int tlen; 

113 int win = 0; 

114 struct route *ro - 0; 

115 if (tp) ( 

116 win = sbspace(&tp-»t, inpcb->inp socket-»so rcv); 

117 ro = &tp-»t inpcb-»inp route; 

118 3 

119 if (m == 0) ( /* generate keepalive probe */ 

120 m = m_gethdr (M_DONTWAIT, MT HEADER); 

121 if (m == NULL) 

122 return; 

123 tlen = 0; /* no data is sent */ 

124 m->m data += max_linkhdr; 

125 *mtod(m, struct tcpiphdr *) = *ti; 


O 26-34 tcp respond [000000 
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126 ti - mtod(m, struct tcpiphdr *); 
127 flags - TH ACK; 
128 ) else ( /* generate RST segment */ 
129 m freem(m-»m next); 
130 m-»m next - 0; 
131 m-»m data - (caddr t) ti; 
132 m->m len = sizeof(struct tcpiphdr); 
133 tlen = 0; 
134 #define xchg(a,b,type) { type t; t=a; a=b; b=t; T 
135 xchg (ti->ti_dst.s_addr, ti->ti_src.s_addr, u long); 
136 xchg (ti->ti_dport, ti->ti_sport, u_short); 
137 #undef xchg 
138 3 
tcp_subr.c 
O 26-34 (0) 
104-110 26-35 3 tcp_respond 
[] U 
tp ti m ack seg flags 
0000 ACKO RST tp ti m 0 ti_ack TH_RST 
ti seq + TH RST| 
00 0 ACKO RST tp ti m ti len " TH ACK 
00000 tp t_template NULL rev nxt snd una 0 
O 26-35 tcp respond 000 
tp TCP ( ) ti IP[] TCP m 
mbuf RST 3 
113-118 tcp input RST 
( SYN ) 
tp winl| ro tp 
ro tcp_input 
1. 
119-127 m mbu 
TCP m m_gethdr 
IP[] TCP mbuf[] TCP tlen 0 
4.2BSD 
TCP COMPAT 42[] Net/3 
tlen 1 0 
( ) 















































































































































































































































ti TCP mbuf| E 
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TCP/IP 2 
mbuf] 
2. RST 
128-138 tcp input RST RST 
mbuf| tcp respond IP TCP 
mbuf ( ) n free mbuf IP 
TCP IP IP 
26-36 tcp_respond 
- - tcp subr.c 
139 ti->ti len = htons((u short) (sizeof(struct tcphdr) 4 tlen)); 
140 tlen += sizeof(struct tcpiphdr); 
141 m->m len = tlen; 
142 m->m pkthdr.len = tlen; 
143 m->m_pkthär.rcvif = (struct ifnet *) 0; 
144 ti->ti next = ti->ti prev = 0; 
145 ti->ti x1 = 0; 
146 ti->ti seq = htonl (seq); 
147 ti->ti ack = htonl (ack); 
148 ti-»ti x2 = 0; 
149 ti->ti off - sizeof(struct tcphdr) >> 2; 
150 ti->ti flags = flags; 
151 if (tp) 
152 ti->ti win - htons((u short) (win >> tp-»rcv. scale)); 
153 else 
154 ti-»ti win = htons((u short) win); 
155 ti-»ti urp = 0; 
156 ti->ti sum = 0; 
157 ti->ti sum = in, cksum(m, tlen); 
158 ((struct ip *) ti)-»ip len = tlen; 
159 ((struct ip *) ti)-»ip ttl - ip defttl; 
160 (void) ip output(m, NULL, ro, 0, NULL); 
161 ) 
tcp. subr.c 
U 26-36 tcp respond U D 0 D D 0 
139—157 TCP IP[] TCP 
tcp template t template 
ip output 
26.10 UI 
TCP (tcp output) RST 
(tcp. respond) 
TCP 
tcp output 
( ) TCP ( ) 
TCP 
tcp output 
( ) 













































































































































































Chi a-bubıcoN 











26 TCP 























711 





















































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































TCP Net/3 
SYN ( 
SYN SYN 
U U 
26.1 26-1 TCP 
TCP 
26.2 26-6 FIN len 0 
FIN 
26.3 Net/3 
tcp do rfc 1323 
26.4 25-28 RTT 8 
RTT 
26.5 26-23 bcopy MSS mss opt[2] 
26.6 26-29 
( TCP 
) 
26.7 26-32 ENOBUFS (1) 
(2) ACK 
ACK RST 
26.8 10 20-30) PSH 
26.9 26-36 ip_defttl TTL 26-32 PCB 
26.10 IP TCP 26-25 mbuf) 
26.11 tcp output ( 500 ) 
IP SYNL FIND URG C 
ip output 
26.12 26.3 100 50 
writev write 
200[] 300 100[] 50 writev 
26.13 tcp now 500ms 
TCP 





























































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































5*1 Hf 
TCP] [| O O TCP 
*tcp_drain | mbu 
*tcp drop RST 
*tcp close TCP FIN 4 
1[] 18.2 4 
*tcp mss MSS TCP MSS MSS 
*tcp ctlinput TCP ICMP 
tcp notify ICMP tcp_quench ICMP 
*TCP REASS tcp_reass 
*tcp trace TCP ( SO DEBUG) trpt 
(8) 
27.2 tcp. drain[|[] 
tcp drain TCP pr_drain mbu 
m_reclaim 10-32 ip_drain 
UDP | TCP mbuf —— 
— [| Net/3 TCP mbuf mbuf 
tcp drain (| TCP IP 
27.3 tcp_drop|| |] 
tcp_drop RST | 
(tcp disconnect ) FIN TCP 
27-1 | tcp. drop 77 000000 errno 
27-2 tcp_drop 
202-213 TCP SYN RST[] tcp. drop 
CLOSED tcp output 24- 16 CLOSED tcp_outflags 
RST 
214-216 errno ETIMEDOUT (|| EHOSTUNREACH) 
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| uut | ETIMEDOUT] 0 0 Ú] ul) 
217 tcp_closel] 




























































































































































































o O errno U [ 
tcp input ENOBUFS 020000005YN0 000000 t template 0000 
mbuf 
tcp_input ECONNREFUSED OOORSTIOOOOOOSYNOOO 
tcp input ECONNRESET 00000000 RST 
tcp_timers ETIMEDOUT 0000000 3000000000 ACKO 25-25) 


C) 


O0000000000 


tcp timers ETIMEDOUT OO (025-1600 Ü 
00000 O000000000 


tcp usrreq ECONNABORTED PRU, ABORT[] [] 


HO 
E] 



























































so LiNGEN][][] D D D D D D 0 


tcp usrreq 0 Dl 























U 27-1 0 0 tee. drop JO D] errno 0 U 



























































































































































































































































































































































































































































































































































































































































































































































tcp subr.c 

202 struct tcpcb * 

203 tcp drop(tp, errno) 

204 struct tcpcb *tp; 

205 int errno; 

206 ( 

207 struct socket *so = tp->t inpcb-»inp socket; 

208 if (TCPS, HAVERCVDSYN(tp-»t state)) { 

209 tp->t state = TCPS CLOSED; 

210 (void) tcp output (tp) ; 

211 tcpstat.tcps drops++; 

212 ) else 

213 tcpstat.tcps, conndrops++; 

214 if (errno == ETIMEDOUT && tp-»t softerror) 

215 errno - tp-»t softerror; 

216 SO-»SO error = errno; 

217 return (tcp close(tp)); 

218 ) 

tcp subr.c 
[] 27-2 tcp drop DD 
27.4 tcp close[l|[] 
LU U U | LAST ACK | [| ACK[] tcp input 
tcp. close 2MSL TIME WAIT[] 
CLOSED tcp timers O tcp. close] | 0 
| | | tcp close (IP[] TCP 
TCP Internet PCB ) 
3 
27.4.1 oou 
rt_metrics (O 18-26)[] 9 6[] O TCP 8 












































































































































714 
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TCP/IP 2 
route (8) (9 rmx pksent ) 27-3 
route -lock rmx_locks ([] 20-13) RTV xxx 
U 
[] TCP | | 
tcp close 3 — RTT RTT 
tcp. close] J] tcp. mss[] [] 
rt metrics] J 00000 00000 route(8)[] D D D 
rmx_expire -expire 
rmx hopcount -hopcount 
rmx mtu . -mtu 
rmx recvpipe . -recvpipe 
rmx rtt . . -rtt 
rmx rttvar . . -rttvar 
rmx_sendpipe . -sendpipe 
rmx_ssthresh . . -ssthresh 
O 27-3 TCPO QQ rt metrics [I] D D D Ú D 
27-4 tcp_close 
1. 
234-248 8192 (sb_hiwat) 
0 131 072 (16) 0 Å ) 
g ( 19.2) 
NX 2%N>D)Y NX 22+131072(N>1) 
|l! 
4G 
Internet 
( ) 
route 
( 19.2) 
250 27-3[] 0 
2. RTT 
251-264 t_srtt 8 ([] 25-19) rmx_rtt 
t_srtt 000 000(RTM_RTTUNIT) 2( ) 8 RTT 
rmx rtt E Ü] | L L 
rmx_rtt 
3. 
265-273 RTT 4 t_rttvar 
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tep subr.c 





225 struct tcpcb * 
226 tcp close(tp) 
227 struct tcpcb *tp; 



































































































































































































































































































































228 ( 
229 struct tcpiphdr *t; 
230 struct inpcb *inp - tp-»t inpcb; 
231 struct socket *so = inp->inp socket; 
232 struct mbuf *m; 
233 struct rtentry *rt; 
234 /* 
235 * If we sent enough data to get some meaningful characteristics, 
236 * save them in the routing entry.  'Enough' is arbitrarily 
237 * defined as the sendpipesize (default 8K) * 16. This would 
238 * give us 16 rtt samples assuming we only get one sample per 
239 * window (the usual case on a long haul net). 16 samples is 
240 * enough for the srtt filter to converge to within 5$ of the correct 
241 * value; fewer samples and we could save a very bogus rtt. 
242 * 
243 * Don't update the default route's characteristics and don't 
244 * update anything that the user "locked". 
245 */ 
246 if (SEQ LT(tp->iss + so-»so snd.sb hiwat * 16, tp->snd max) Eë 
247 (rt - inp-»inp route.ro rt) && 
248 ( (struct sockaddr in +) rt key(rt))-»sin addr.s addr !- INADDR ANY) { 
249 u long i; - 
250 if ((rt-»rt rmx.rmx locks & RTV RTT) == 0) ( 
251 i = tp-»t srtt * i 
252 (RTM RTTUNIT / (PR SLOWHZ * TCP_RTT_SCALE)); 
253 if (rt->rt_rmx.rmx_rtt && i) 
254 /* 
255 * filter this update to half the old & half 
256 * the new values, converting scale. 
257 * See route.h and tcp var.h for a 
258 * description of the scaling constants. 
259 */ 
260 rt-»rt rmx.rmx rtt - 
261 (rt-»rt rmx.rmx rtt + i) / 2; 
262 else 
263 rt-»rt rmx.rmx rtt - i; 
264 } 
265 if ((rt-»rt rmx.rmx locks € RTV RTTVAR) == 0) í 
266 i = tp->t_rttvar * 
267 (RTM RTTUNIT / (PR SLOWHZ * TCP RTTVAR SCALE) ); 
268 if (rt->rt rmx.rmx rttvar && i) 
269 rt-»rt rmx.rmx rttvar = 
270 (rt-»rt rmx.rmx rttvar + i) / 2; 
271 else 
272 rt-»rt rmx.rmx rttvar - i; 
273 ) 
: tcp_subr.c 
0 27-4 tcp close [1D IJ] DJ PJ RTTI L JI] 1 
27-5 tcp_close 
274-283 (1) (rmx_ssthresh DO (2) 
rmx_sendpipe snd_ssthresh rmx_sendpipe 
TCP rmx_ssthresh 
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TCP/IP 2 
TCP 
24 a tcp_subr.c 
275 * update the pipelimit (ssthresh) if it has been updated 
276 * already or if a pipesize was specified & the threshhold 
277 * got below half the pipesize. I.e., wait for bad news 
278 * before we start updating, then update on both good 
279 * and bad news. 
280 */ 
281 if ((rt->rt rmx.rmx locks & RTV SSTHRESH) == 0 && 
282 (i = tp->snd ssthresh) && rt->rt rmx.rmx ssthresh | | 
283 i < (rt-»rt rmx.rmx sendpipe / 2)) { 
284 få 
285 * convert the limit from user data bytes to 
286 * packets then to packet data bytes. 
287 */ 
288 i = (i + tp->t_maxseg / 2) / tp->t_maxseg; 
289 if (i < 2) 
290 i = 2; 
291 i *= (u long) (tp->t maxseg + sizeof(struct tcpiphdr)); 
292 if (rt->rt_rmx.rmx_ssthresh) 
293 rt->rt rmx.rmx ssthresh = 
294 (rt->rt rmx.rmx ssthresh + i) / 2; 
295 else 
296 rt->rt rmx.rmx ssthresh = i; 
297 ) 
298 ) 
tcp_subr.c 
[] 27-5 tcp close 020200000000 
284-290 snd_ssthresh MSS(t_maxseg) 
1/2t maxseg snd ssthresh 
291-297 MSS IP[] TCP (40) 
rmx ssthresh 27-4 ( 1/2 1/2) 
27.4.2 00 
27-6 tcp_close 
Jug S tcp subr.c 
/* free the reassembly queue, if any */ 
300 t = tp-»seg next; 
301 while (t !- (struct tcpiphdr *) tp) ( 
302 t - (struct tcpiphdr *) t-»ti next; 
303 m - REASS MBUF((struct tcpiphdr *) t->ti prev); 
304 remque(t-»ti prev); 
305 m_freem (m) ; 
306 } 
307 if (tp->t_template) 
308 (void) m_free (dtom(tp->t_template)); 
309 free(tp, M_PCB); 
310 inp->inp_ppcb = 0; 


0 27-6 tcp close 000000000 
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311 soisdisconnected (so); 
312 /* clobber input pcb cache if we're closing the cached connection */ 
313 if (inp == tcp last inpcb) 
314 tcp last, inpcb = &tcb; 
315 in pcbdetach (inp); 
316 tcpstat.tcps_closed++; 
317 return ((struct tcpcb *) 0); 
318 3 
tcp_subr.c 
[27-6 di? 
1. mbuf 
299-306 
27.9 
Ze TCP 
307-309 m_free IP[] TCP free TCP 
sodisconnected PRU_DISCONNECT 
3. PCB 
310-318 Internet PCB TCP TCP[] PCB 
tcp_last_inpcb in_pcbdetach PCB 
27.5 tcp_mssl] [] 
tcp_mss 
1)tcp output SYN MSS 
2)tcp input SYN MSS 
tcp mss MSS 
27-7 tcp mss PCB 
tcp_input.c 
1391 int Kani 


1392 tcp mss(tp, offer) 
1393 struct tcpcb *tp; 


` 1394 u_int offer; 
1395 ( 
1396 struct route *ro; 
1397 struct rtentry *rt; 
1398 struct ifnet *ifp; 
1399 int rtt, mss; 
1400 u_long bufsize; 
1401 struct inpcb *inp; 
1402 struct socket *so; 
1403 extern int tcp mssdflt; 
1404 inp = tp-»t inpcb; 
1405 ro = &inp->inp route; 
1406 if ((rt = ro-»ro rt) == 


(struct rtentry *) 0) 


t 


U 27-7 tæmss UUDUDPCRBUDUDUDODDDUO UD D U 
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1407 /* No route yet, so try to acquire one */ 

1408 if (inp->inp_faddr.s_addr != INADDR_ANY) { 

1409 ro->ro_dst.sa_family = AF_INET; 

1410 ro->ro_dst.sa_len = sizeof (ro->ro_dst); 

1411 ((struct sockaddr in +) &ro->ro dst)->sin addr = 

1412 inp->inp faddr; 

1413 rtalloc (ro); 

1414 } 

1415 if ((rt = ro->ro_rt) == (struct rtentry *) 0) 

1416 return (tcp mssdflt); 

1417 } 

1418 ifp = rt->rt_ifp; 

1419 so = inp->inp_socket; tep_input.c 
[| 297 103 

1. 
1391-1417 rtalloc 
ifp MTU TCP MSS 
512(tcp_mssdflt) 
27-8 tcp_mss 
t_rttmin|| t_srtt[|| t rttvar 





























































































































1420 MO T7T m A  I$SË2_Ü20x1put.c 


1420 
1421 
1422 
1423 
1424 
1425 
1426 
1427 
1428 
1429 
1430 
1431 
1432 


1433 
1434 
1435 
1436 
1437 
1438 
1439 


1440 
1441 
1442 
1443 


* While we're here, check if there's an initial rtt 
* or rttvar. Convert from the route-table units 

* to scaled multiples of the slow timeout timer. 

*/ 


if (tp->t_srtt == 0 && (rtt = rt->rt rmx.rmx rtt)) I 


) 


/* 
* XXX the lock bit for RTT indicates that the value 
* is also a minimum value; this is Subject to time. 
*/ 
if (rt->rt rmx.rmx locks & RTV RTT) 
tp->t rttmin = rtt / (RTM RTTUNIT / PR SLOWHZ); 
tp->t_srtt = rtt / (RTM RTTUNIT / (PR SLOWHZ * TCP RTT SCALE)); 


if (rt-»rt rmx.rmx rttvar) 
tp->t_rttvar = rt-»rt rmx.rmx rttvar / 
(RTM RTTUNIT / (PR SLOWHZ * TCP RTTVAR SCALE) ) ; 
else 
/* default variation is +- 1 rtt */ 
tp->t rttvar = 
tp->t srtt + TCP RTTVAR SCALE / TCP RTT SCALE; 


TCPT RANGESET (tp->t_rxtcur, 
((tp->t srtt >> 2) + tp-»t rttvar) >> 1, 
tp->t rttmin, TCPTV REXMTMAX) ; 


———— — n HEH inpul.c 





U 278 tepmss J)00000000000RTQO00 





2. 





























RTT 






































1420-1432 













































































RTT (c_srtt=0) rmx_rtt 
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RTT t_srtt RTV_RTT 
RTT(t_rttmin) rmx_rtt tcp newtcpcb 
t rttmin 20 0 
rmx rtt( ) t srtt([]8 ) 27-4 
t_rttmin t_srttl] 1/8 TCP RTT SCALE 
3. RTT 
1433-1439 rmx rttvar( ) t rttvar([]4 
) t rttvar t rtt | | RTT 
+1 RTT | t. rttvar 4 t rtt 8 
t srtt 
4. RTO 
1440-1442 RTO t rxtcur 
RTO=srtt+2X rttvar 
RTO 2 4 25-21 
terte N 
tørte t rttvar 4 BEE 
RTO =——-n x ——ə = 
8 4 2 
TCPT_RANGESET 
27-9 tcp_mss MSS 
tcp_input.c 
1444 /* cp-mp 
1445 * if there's an mtu associated with the route, use it 
1446 */ 
1447 if (rt-»rt rmx.rmx mtu) 
1448 mss = rt->rt rmx.rmx mtu - sizeof(struct tcpiphdr); 
1449 else ( 
1450 mss = ifp-»if mtu - sizeof(struct tcpiphdr); 
1451 #if (MCLBYTES & (MCLBYTES - 1)) -- 0 
1452 if (mss » MCLBYTES) 
1453 mss &= "(MCLBYTES - 1); 
1454 #else 
1455 if (mss » MCLBYTES) 
1456 mss - mss / MCLBYTES * MCLBYTES; 
1457 #endif 
1458 if (!in_localaddr (inp->inp_faddr)) 
1459 mss = min(mss, tcp_mssdflt); 
1460 } . 
tcp_input.c 
[] 27-9 tcp mss 000090 mss 
5. MTU MSS 
1444-1450 | | MTU mss mss 
MTU 40(IP[] TCP ) MSS 1460 
6. MSS MCLBYTES 
1451-1457 mss MCLBYTES mss 
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TCP/IP 2 
MCLBYTES(mbu ) MCLBYTES[ ( 1024] 2048)[] MCLBYTES 
1 MCLBYTES 2 1024(0x400) 1023(0x3ff) 
0 
mss | mss MCLBYTES | 
mbuf 1024[] mss 1023 (OxfffffCO0) 10 bit 
mss 1460 1024 mbuf 2048 2047 
(Oxffff8000) 11 bit MTU 4464 
mss[] 4424 4096 MCLBYTES 2 mss MCLBYTES 
| MCLBYTES mss MCLBYTES | 
7. 
1458-1459 IP (in localaddr ) mss 
512(tcp mssdflt) mss 512 
IP subnetsarelocal 
SUBNETSARELOCAL 1 IP 
I ID 0 
IP IP 
MSS IP 
WAN MTU 1006 ARPANET 10 11.7 
WAN 1500 MTU 
1[] 24.2 MTU (RFC 1191[] [Mogul and Deering 19901) 
Net/3 MTU 
27-10 tcp mss 
8. MSS 
1461-1472 tcp mss|[| tcp input offer mss 
mss offer mss 1024 
512 mss 512 mss 536( MTU 
576) 1460[] TCP 536 mss 
tcp mss[] tcp. output offer 0 MSS 
mss 32 
1473-1483 mss tcp. newtcpcb t maxseg(512) | [| TCP 
MSS (offer ) rmx sendpipe 
(high-water) (U 16-4) mss 
rmx sendpipe 
8192 mss 
9. MSS 
1484-1489 mss sb. max(Net/3 
262 144 256X 1024) sbreserve 
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8192 TCP mbuf| 2048( mss 1460) 
8760( 6X 1460) mss 512 8192 
"TES 7^ tcp. input.c 
1462 * The current mss, t maxseg, was initialized to the default value 
1463 * of 512 (tcp mssdflt) by tcp newtcpcb(). 
1464 * If we compute a smaller value, reduce the current mss. 
1465 * If we compute a larger value, return it for use in sending 
1466 * a max seg size option, but don't store it for use 
1467 * unless we received an offer at least that large from peer. 
1468 * However, do not accept offers under 32 bytes. 
1469 */ 
1470 if (offer) 
1471 mss = min(mss, offer); 
1472 mss - max(mss, 32); /* sanity */ 
1473 if (mss < tp-»t maxseg || offer != 0) ( 
1474 qe 
1475 * If there's a pipesize, change the socket buffer 
1476 * to that size. Make the socket buffers an integral 
1477 * number of mss units; if the mss is larger than 
1478 * the socket buffer, decrease the mss. 
1479 */ 
1480 if ((bufsize = rt->rt rmx.rmx sendpipe) == 0) 
1481 bufsize = so->so_snd.sb_hiwat; 
1482 if (bufsize < mss) 
1483 mss = bufsize; 
1484 else { 
1485 bufsize = roundup(bufsize, mss); 
1486 if (bufsize > sb max) 
1487 bufsize = sb_max; 
1488 (void) sbreserve(&so->so snd, bufsize); 
1489 } 
1490 tp->t_maxseg = mss; 
1491 if ((bufsize = rt->rt rmx.rmx recvpipe) == 0) 
1492 bufsize = so-»so rcv.sb hiwat; 
1493 if (bufsize > mss) ( 
1494 bufsize = roundup(bufsize, mss); 
1495 if (bufsize » sb max) 
1496 bufsize - sb max; 
1497 (void) sbreserve(&so-»so rcv, bufsize); 
1498 J 
1499 } 
1500 tp->snd_cwnd = mss; 
1501 if (rt-»rt rmx.rmx ssthresh) { 
1502 /* 
1503 * There's some sort of gateway or interface 
1504 * buffer limit on the path. Use this to set 
1505 * the slow start threshhold, but set the 
1506 * threshold to no less than 2*mss. 
1507 */ 
1508 tp->snd_ssthresh = max(2 * mss, rt->rt rmx.rmx ssthresh); 
1509 } 
1510 return (mss); 
1511 } 





tcp_input.c 
U 27-10 tcp mss [000000 


1490 t_maxseg (512) MSS 
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China-pub.com 








































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































1491-1499 
10. 
1500-1509 snd_cwnd 
rmx ssthresh (snd ssthresh) 
1510 mss[] tcp. input ([] 28-10 MSS 
JO D O 26-23 tcp. output[] [J MSS 
i | tcp_mss i L L 
SYN | | O MSS SYN 
1) tcp_newtcpcb t_maxsegl] 512 
2) connect SYN MSS tcp_output 
tcp_mss offer IP mbu 2048 
27-9 mss 1460 offer 27-10 mss 
1460 1460 (512) MSS 
tcp_output MSS MSS 1460 
3) SYN mss 1024|] tcp. input tcp_mss offer 
1024 27-9 mss[] 1460 U U 27-10 min mss 
1024 offer 1024 ( 8192)[] t. maxseg 
1024 
tcp mss U O TCP mss 1460 
mss 1024 TCP 1024 
1460 1024 
1460 27-10 mss 
TCP mss[] 1460 mss 1024 
1460 1024 
27.6 tep_ctlinput[] [| 
22-32 tcp_ctlinput 5 ICMP 0 
TCP[] UDP 
4 TCP tcp_ctlinput 
27-11 tcp_ctlinput 23-301] udp_ctlinput 
365-366 [] tcp. ctlinputl] odp ctlinput O OO ICMP 
inetctlerrmap OL] UDP TCP 
notify tcp_notify tcp_quench 





























China-pubutom ma 723 
































































































































































































































































































































































































































tcp_subr.c 
355 void 
356 tcp_ctlinput (cmd, sa, ip) 
357 int cmd; 
358 struct sockaddr *sa; 
359 struct ip *ip; 
360 { 
361 struct tcphdr “th; 
362 extern struct in_addr zeroin_addr; 
363 extern u_char inetctlerrmap[]; 
364 void (*notify) (struct inpcb *, int) = tcp notify; 
365 if (cmd == PRC QUENCH) 
366 notify = tcp_quench; 
367 else if (!PRC IS REDIRECT (cmd) && 
368 ((unsigned) cmd > PRC_NCMDS || inetctlerrmap[cmd] == 011 
369 return; E 
370 if (ip) ( f 
371 th = (struct tcphdr *) ((caddr_t) ip + (ip->ip_hl << 2)); 
372 in pcbnotify(&tcb, sa, th->th_dport, ip->ip_src, th-»th sport, 
373 cmd, notify); 
374 ) else 
375 in pcbnotify(&tcb, sa, 0, zeroin addr, 0, cmd, notify); 
ie tcp_subr.c 
[] 27-11 tcp ctlinput ID 
27.7 tcp notify[] [] 
tcp notify||tcp ctlinput 
UDP TCP 
27-12 tcp motify 
tcp subr.c 


328 void 
329 tcp notify(inp, error) 
330 struct inpcb *inp; 


331 int error; 

332 ( 

333 struct tcpcb *tp - (struct tcpcb *) inp-»inp ppcb; 
334 Struct socket *so - inp-»inp socket; 

335 / 


* 
336 * Ignore some errors if we are hooked up. 
337 * If connection hasn't completed, has retransmitted several times, 
338 * and receives a second error, give up now. This is better 

* 


339 than waiting a long time to establish a connection that 

340 * can never complete. 

341 * A 

342 if (tp->t_state == TCPS_ESTABLISHED && 

343 (error == EHOSTUNREACH || error == ENETUNREACH || 

344 error == EHOSTDOWN)) { 

345 return; 

346 } else if (tp->t state < TCPS_ESTABLISHED && tp->t_rxtshift > 3 && 
347 tp->t_softerror) 


348 so->so_error = error; 


0 27-12 tcp notify 00 





724 


349 
350 
351 
352 
353 
354 } 


TCP/IP 2 









































else 
tp->t_softerror = 


sorwakeup (so); 
sowwakeup (so); 





error; 
wakeup ( (caddr_t) & so->so_timeo); 


O 27-12 (0) 





328-345 
EHOSTDOWN 




































































ESTABLISHED 
































EHOSTUNREACH 


China-pubecom 


tcp. subr.c 




















ENETUNREACH 















































Net/2 



























































































































































































































































tcp xmit timer 





ACK 


























































































































346-353 




















TCP 














t softerror 















































































































































































































































select 









































t softerror 













































































tcp drop 








tcp drop 
























































t softerror 


| 
27.8 tcp quench[] [] 













































































































































































errno 



















































































27-13 






































tcp  quench | 





| TCP 





















































































































































tcp input 






































ip output 
































tp output 





381 void 

382 tcp quench(inp, errno) 
383 struct inpcb *inp; 

384 int errno; 

385 ( 


386 struct tcpcb *tp - 


387 
388 
389 ) 


if (tp) 
tp->snd_cwnd 


[l] 22.43 





ENOBUFS 
























































intotepcb (inp); 


tp->t_maxseg; 


tcp_quench 




































































tcp_subr.c 


tcp_subr.c 
































































































































tcp timers 
































































































































snd ssthresh 





















































27.9 TCP_REASS|| || tcp. reass[l |] 





TCP | | | 
































































































































TCP|| [] | 













































































27 TCP 


725 


















































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































mbuf () 
0 - 1023 ( [made 144 
) 2048 - 3071 Damn 
|m flags ` ` Ju PKTHDR 
TCP | mæpkthår.len |44 
n pkthdr. revit [pir 
( 1024 - i 
2047 ) Å x 
TCP tcp. iS tipe em 
E Ras eno 
mbu IP TCP 2000) 
4 ( 2-14 
) 27-14 
70 80 90 10 yeu 
24-12 tcpiphdr 
ipovlyl| tcphdr tcphdr 40000 
24-12 27-14 
ti nextl|ti prev 
ti len[|| ti dport|| ti seq 
TCP 
seg next O 27-14 QOO00 400000 PQ Ter] [J 
seg_prev[| ti next[] ti prev IP 8 TCP 
ti_len TCP TCP 
27.9.1 TCP_REASS 
tcp_input 27-15 TCP_REASS 
TCP_REASS 29-22 
54-63 tp TCP ti tcpiphdr 
3 
1) ( ti seq rcv nxt) 
2) (seg next mbuf) 
3) ESTABLISHED 
ACK rev nxt 
TCP FIN flags TH FIN 




















































































































































































































































































































726 


TCP/IP 2 












































China=pub,com 








































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































- - tcp input.c 
53 #define TCP REASS(tp, ti, m, so, flags) ( \ 
54 if ((ti)->ti seq == (tp)-»rcv nxt Eë \ 
55 (tp) ->seg_next == (struct tcpiphdr *) (tp) && \ 
56 (tp)-»t state == TCPS ESTABLISHED) ( N 
57 tp->t flags |= TF DELACK; \ 
58 (tp)-»rcv.nxt += (ti)-»ti len; \ 
59 flags = (ti)->ti flags & TH FIN; \ 
60 tcpstat.tcps_revpack++; \ 
61 tcpstat.tcps rcvbyte += (ti)->ti_len; \ 
62 sbappend (& (so) ->so_rcv, (m)); A 
63 sorwakeup (so); \ 
64 } else { \ 
65 (flags) = tcp_reass((tp), (ti), (m)); \ 
66 tp->t_flags |= TF_ACKNOW; \ 
67 IN 
68 ) " 
tcp input.c 
[] 2715 XE mass I N0O000000000000 
3 
SYN 
ESTABLISHED 
64—67 3 TCP REASS TCP REASS 
TF ACKNOW ACK[] TCP 
ACK (29.4[] ) 
TCP_REASS 27-14[] TCP 
ti sport[] ti dport TCP TCP REASS 
TCP mbu 
27-14 IP[] TCP mbuf 
dtom 2.6 m pullup IP[] TCP 
( 2-16 JU dtom 
TCP TCP mbuf| (back pointer) TCP 
27-16 
mbu TCP seg_next 
seg_prev ti_next 
l(rcv_nxt) 
1461-4380 TCP m_devget 
mbuf| 2-16 






















































































Chi a*pUbeCom 





27 TCP 






































tcpcb{} 


seg_prev 


rev nxt 





mbuft{} 


m_nextpkt 
m_len 


m pkthdr.len 
m pkthdr.rcvif 
m ext.ext buf 
m ext.ext free 
m ext.ext, size 




















20480 0 0 


14600 000 





mbuf () 
m next 
m nextpkt 
m len 
m type 
M EXT 
m pkthdr.len 


m ext.ext, free 


20480 0 O 

ti_next 
ipovly() 
(200 0 ) 
tcphdr() 
(200 0 ) 


14600 0 00 









































































































































































































































































































































0 27-16 DO DD TCP 0000 mbufi (] 
TCP 32 bit mbu TCP_REASS 
27.9.2 TCP_REASS 
27-17 TCP_REASS tp TCP 
IP[] TCP m mbuf 


















































































































































































































































728 rem a China+pub.tom 
$a DD 





































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































| ti DI m[] D mbu | | | | 
tcp_input.c 
69 int PE 
70 tcp_reass(tp, ti, m) 
71 struct tcpcb *tp; 
72 struct tcpiphdr *ti; 
73 struct mbuf *m; 
74 ( 
75 struct tcpiphdr *q; 
76 struct socket *so = tp->t_inpcb->inp_socket; 
77 int flags; 
78 ZS 
79 * Call with ti==0 after become established to 
80 * force pre-ESTABLISHED data up to user socket. 
81 */ 
82 if (ti == 0) 
83 goto present; 
84 /* 
85 * Find a segment that begins after this one does. 
86 */ 
87 for (q = tp-»seg next; q !- (struct tcpiphär *) tp; 
88 q = (struct tcpiphdr *) q->ti next) 
89 if (SEQ GT(q-»ti. seq, ti-»ti seq)) 
90 break; i 
tcp input.c 
H 27-17 træ mass NO 00000 
69-83 TCP SYN tcp input TCP REASS 
ti (U 28-20 29-2) SYN 
(TCP REASS ) 
" present” 27-23 
84-90 seg_next 
(ti seg) for if 
27-18 q 
10-15 ti next 
ti prev | |] [] (ti seq) [] (ti len) 0 
| EL O mbuf 27-14 





























































































































ti_seq=10 


0 27-18 0000000000000 





China+pub.tom mo 




















729 





























































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































27-19 TCP REASS 
tcp_input.c 
91 pe RR 
92 * I£ there is a preceding segment, it may provide some of 
93 * our data already. If so, drop the data from the incoming 
94 * segment. If it provides all of our data, drop us. 
95 */ 
96 if ((struct tcpiphdr *) g->ti prev != (struct tcpiphdr *) tp) { 
97 int i; 
98 q = (struct tcpiphdr *) q->ti prev; 
99 /* conversion to int (in i) handles seg wraparound */ 
100 i = q-»ti seq + q-»ti len - ti-»ti seq; 
101 if (i > O) { 
102 if (i >= ti->ti_len) ( 
103 tcpstat.tcps_revduppack++; 
104 tcpstat.tcps rcvdupbyte += ti->ti_len; 
105 m_freem(m) ; 
106 return (0); 
107 } 
108 m_adj(m, i); 
109 ti->ti_len -= i; 
110 ti->ti_seq += i; 
111 } 
112 q = (struct tcpiphdr +) (q->ti_next); 
113 } 
114 tepstat.tcps_rcvoopack++; 
115 tcpstat.tcps rcvoobyte += ti->ti_len; 
116 REASS_MBUF (ti) = m; /* XXX */ Ñ 
tcp input.c 
DH 27-19 TOS Rass II 00000 
91-107 q 
q q (U 27-18 4-8 ) 
i 
i = q->ti_seq + q->ti len - ti->ti_seq; 
= 4 + 5 -7 
= 2 
i 0 
(i) 
108-112 (0 D 27-180 0)0 madj i 
q 27-20 
27-18 
116 mbuf m TCP 
TCP mbu dtom REASS_MBUF 








































































































































































































#define REASS_MBUF (ti) (*(struct mbuf **)&((ti)->ti_t)) 


ti_t 

































































tepharl] D ( 24-12) 


















































16bit 












































27-19 























“ XXX ” 



















































































































































































bit 





























32 












































730 TCP/IP 2 China-bubıtoM 
— __ 


EE G [5 [6 [7 [8 | 





02720 p00000000070800000 27-18 






































































































































27-21 tcp_reass 





















































































































































117-135 
















































































ait 27-18 
i=9 + 2 — 10 






























































































































































































































































































































































































































































































































































































































































































































































































































































































































































10 
1 3 
1) i 0 
2) å (q->ti len) m adj 
i 
3) i 
136-139 insque 27-22 
27-18 
tcp_input.c 

117 JE vr 
118 * While we overlap succeeding segments trim them or, 

119 * if they are completely covered, dequeue them. 

120 Fr 

121 while (q != (struct tcpiphdr *) tp) { 

122 int i = (ti->ti seq + ti->ti_len) - q->ti seg; 

123 if (i <= 0) 

124 break; 

125 if (i < q-»ti len) { 

126 q->ti seq += i; 

127 q->ti len -= i; 

128 m adj (REASS_MBUF (q), 1); 

129 break; 

130 3 

131 q = (struct tcpiphdr +) g->ti next; 

132 m = REASS MBUF((struct tcpiphdr *) g->ti prev); 

133 remgue(g->ti prev); 


D 27-21 tœ mass II 00000 





731 


O 271 TCP| 




















134 m freem(m); 

135 H 

136 Zë 

137 * Stick new segment in its place. 
138 *7 

139 insque (ti, q->ti prev); 


tcp. input.c 


O 27-21 (0) 








02722 p000000000000 27-20 











































































































U 27-231] tcp reass[]| U U UD D D UD D D 0 D 00 U 
140 Present: PE 
141 /* 

142 * Present data to user, advancing rcv nxt through 
143 * completed sequence space. 

144 */ 

145 1f (TCPS_HAVERCVDSYN(tp->t_state) == 0) 

146 return (0); 

147 ti = tp->seg_next; 

148 if (ti == (struct tcpiphdr *) tp || ti->ti_seq != tp->rcv_nxt) 
149 return (0); 

150 if (tp->t state == TCPS_SYN_RECEIVED && ti->ti_len) 
151 return (0); 

152 do { 

153 tp->rcv_nxt += ti->ti len; 

154 flags = ti->ti flags & TH FIN; 

155 remque(ti); 

156 m = REASS MBUF (ti); 

157 ti = (struct tcpiphdr +) ti->ti next; 

158 if (so->so state & SS CANTRCVMORE) 

159 m freem(m); 

160 else 

161 sbappend(&so-»so rcv, m); 

162 } while (ti != (struct tcpiphdr *) tp && ti->ti seq == tp-»rcv nxt); 
163 sorwakeup (so); 

164 return (flags); 

165 } 


tcp_input.c 
O 27-23 tcp reass 0000000 


732 


















































































































































China-pubecom 

















































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































TCP/IP 2 
145-146 SYN( LISTEN SYN SENT ) 
TCP_REASS 0 
flags FIN TCP_REASS 29-22 
SYN[] FIN ( ) 
147-149 ti 
(ti->ti seq) (rev nxt) 0 
27-22 
4 rcv nxt 2 2[] 3 
4-15 0 FIN ( ) 
FIN 
150-151 SYN_RCVD 0 
SYN 
152-164 ( 
) rev nxt 
flags ( ) 0 TH FIN 
FIN 
mbuf sorwakeup 
27.10 tcp trace|| |] 
26-32 IP tcp output tcp trace 
if (so->so options & SO DEBUG) 
tcp trace(TA OUTPUT, tp->t state, tp, ti, 0); 
trpt (8) 
TCPDEBUG tcpconsdebug 
TCP SO_DEBUG TCP 
trpt 
SO DUBUG (L) UDP IP) TCP 
tcp debug 27-24 
35-43 tcp_debug (196 ) IP[] TCP 
tcpiphdr TCP tcpcb TCP 
trpt trpt 
(Net/3 ) 25-28 RTT 























































































































































































































Chinaspub.com a AH 






















































































































































































































































































































































































































































































































































































































































































































































































































































































tcp_debug.h 
35 struct tcp_debug { p- 8 
36 ntime td time; /* iptime(): ms since midnight, UTC */ 
37 short td act; /* TA_xxx value (Figure 27.25) */ 
38 short td_ostate; /* old state */ 
39 caddr_t td tcb; /* addr of TCP connection block */ 
40 struct tcpiphdr td ti; /* IP and TCP headers */ 
41 short td reg; /* PRU xxx value for TA USER */ 
42 struct tcpcb td cb; /* TCP connection block */ 
43 ); 
53 #define TCP NDEBUG 100 
54 struct tcp debug tcp debug[TCP NDEBUG]; 
55 int tcp debx; 
tcp. debug.h 
[] 27-24 tcp debug [] JJ 
53-55 27-24 tcp_debug 
(tcp_debx) UUL 20 000[ 
DO tcp trace 40 [| DI OD td aert i l U LU 
o 27-250 0 
td-act O U O O 
TA_DROP OOO0000000000 tep input O [ 29-27 
TA INPUT 0000000000 Cep output] O [] 29-26 
TA OUTPUT 00 ip output 000000 [] 26-32 
TA USER RPU xxx[] U HH B] HH BH D] HH D]. tep vsr real) Ü [] 30-1 
DJ 27-25 td act 00000 teo tree DI 
27-26 tcp trace |] Ú | L| 
48-133 00090 ostatel] 000001 U ¢ L 
[] ) L 0 27-25 TA_OUTPUT 
0 3| 
tcp. debug.c 
48 void Pp- 8 


49 tcp_trace(act, ostate, tp, ti, req) 
50 short act, ostate; 

51 struct tcpcb *tp; 

52 struct tcpiphdr *ti; 


53 int req; 

54 ( 

55 tcp_seq seq, ack; 

56 int len, flags; 

57 struct tcp_debug *td = &tcp_debug[tcp_debx++]; 

58 if (tcp_debx == TCP_NDEBUG) 

59 tcp_debx = 0; /* circle back to start */ 
60 td->td_time = iptime(); 

61 td->td_act = act; 


0 27-26 tcp trace [JO00000000000000 





WA en China-pub.com 
LT ett A "eem 





































































































































































































































































































































































































































































































































































































































































































































































































































































































62 td->td ostate = ostate; 

63 td->td_tcb = (caddr t) tp; 

64 if (tp) 

65 td->td cb = *tp; /* structure assignment */ 

66 else 

67 bzero((caddr t) & td->td cb, sizeof(*tp)); 

68 if (ti) 

69 td->td ti = *ti; /* structure assignment */ 

70 else 

71 bzero((caddr t) & td->td ti, sizeof(*ti)); 

72 td->td req = req; 

73 #ifdef TCPDEBUG 

74 if (tcpconsdebug -- 0) 

75 return; 

E S 
132 #endif 
133 } 
tcp_debug.c 
U 27-26 (0) 
U U 0 U 


U 27-270 D O tepdumpl[| 000400002512 D 00 D 000000000000 
U U 0 000 (0100 A000 tcpdump DU EH D U U 0 0 
1 0.0 bsdi.1025 > vangogh.discard: S 20288001:20288001(0) 
win 4096 <mss 512> 


2 0.362719 (0.3627) vangogh.discard > bsdi.1025: S 3202722817:3202722817(0) 
ack 20288002 win 8192 
<mss 512> 


3 0.364316 (0.0016) bsdi.1025 > vangogh.discard: . ack 1 win 4096 
4 0.415859 (0.0515) bsdi.1025 > vangogh.discard: . 1:513(512) ack 1 win 4096 


0 27-27 [D D 25-280 0 O tcedump UD 


0272870000000 tret 0000 


027280000000 tret 00000000000 32bip 0000000 
p0000(xe0000000000000)000tre:0 16000000000 
U 100 D 0 0 0 D'U 0 252800000000 t rtt[] t_rxtcur D Dn D D tret 
U U 


953738 SYN SENT: output 20288001:20288005(4) @0 (win=4096) 
<SYN> -> SYN SENT 
rev nxt 0, rev wnd 0 
snd una 20288001, end nxt 20288002, snd max 20288002 
snd wll 0, snd w12 0, snd wnd 0 
REXMT=12 (t rxtshift=0), KEEP=150 


O 27-28 000 25-280 O O tree 0 D] 


Chi a-bubıcoN 





27 TCP 735 






































t_rtt=1, t srtt=0, t_rttvar=24, t_rxtcur=12 


953739 CLOSED: user CONNECT -> SYN_SENT 
rcv nxt 0, rcv wnd 0 
snd una 20288001, snd nxt 20288002, snd max 20288002 
snd_wl1 0, snd w12 0, snd wnd 0 
REXMT-12 (t rxtshift-0), KEEP-150 
t rtt-1, t_srtt=0, t rttvar-24, t rxtcur-12 


954103 SYN SENT: input 3202722817:3202722817(0) 020288002 (win=8192) 
<SYN,ACK> -» ESTABLISHED 
rcv nxt 3202722818, rcv wnd 4096 
snd una 20288002, snd nxt 20288002, snd max 20288002 
snd wll 3202722818, end wl2 20288002, snd wnd 8192 
KEEP-14400 
t rttz0, t srtt-16, t rttvar-4, t rxtcur=6 


954103 ESTABLISHED: output 20288002:20288002(0) 83202722818 (win-4096) 
<ACK> -» ESTABLISHED 
rcv nxt 3202722818, rcv wnd 4096 
snd una 20288002, end nxt 20288002, snd max 20288002 
snd wll 3202722818, snd wl2 20288002, snd wnd 8192 
KEEP-14400 
t rtt=0, t srtt-16, t rttvar-4, t rxtcur-6 


954153 ESTABLISHED: output 20288002:20288514(512) 83202722818 (win-4096) 
«ACK» -» ESTABLISHED 
rcv nxt 3202722818, rcv wnd 4096 
snd una 20288002, snd nxt 20288514, snd max 20288514 
snd_wl1 3202722818, snd w12 20288002, snd wnd 8192 
REXMT-6 (t rxtshift-0), KEEP-14400 
t rtt-1, t srtt-16, t rttvar-4, t rxtcur-6 



















































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































O 27-28 ([]) 
953 738 SYN 8 
6 (20 288 005) SYN 4 
MSS 6[] (REXMT) 75[] (KEEP) 
500 ms t rtt 1 RTT 
SYN connect 
connect SYN TCP 
PRU CONNECT tcp trace 
connect CLOSED SYN SYN SENT 
954 103 365 ms (tcpdump 362.7ms) 
25-28 " (ms)” SYN[] ACK 
SYN SENT ESTABLISHED RTT 
SYN ACK 
(rtt 0) 954 103 connect 
write TCP 
954 153 50 ms 
50 20 288 002 3 
write 3 





























































































































































































































73 6 TCP/IP 



























































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































2 
TCP PRU END PRU SEND 
512 3 TCP 
4 25-28 TCP 4096 
mbu | 1024 
si an 
TCP 
TCP FIN 4 
RST 
8 3 6 
RTT 
MTU 

TCP ICMP == TCP Net/3 
ICMP Berkeley 

TCP TCP TCP 

SO_DEBUG tcpdump 

U U 

27.1 27-1 errno 0 

27.2 rmx rtt | 

27.3 (U 27-3) 

FTP 
27-4 FTP 


























































































































































































































Ais 


1281 TOPO OD 


28.1 UI 















































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































TCP tcp_input 1100 
Net/3 RFC 793 
TCP ipintr( 
pr input ) tcp input tcp input 
28-1 tcp input 
RST ACK 
( ) 
PCB “ (header prediction)" (28.40 ) 
TCP 
tcp input 
" dodata” 
tcp output 













































































void 
tcp input() 
f : 

checksum TCP header and data; 
findpcb: 

locate PCB for segment; 

if (not found) 

goto dropwithreset; 


reset idle time to 0 and keepalive timer to 2 hours; 
process options if not LISTEN state; 


if (packet matched by header prediction) { 
completely process received segment; 
return; 


J 


switch (tp-»t state) { 

case TCPS LISTEN: 
if SYN flag set, accept new connection request; 
goto trimthenstep6; 


case TCPS SYN SENT: 
if ACK of our SYN, connection completed; 
trimthenstepó: 
trim any data not within window; 


Q 28-1 TCPOOOOOU0U 









































738 TCP/IP 02 China+pub.tom 
— EE 


goto step6; 
} 


process RFC 1323 timestamp; 
check if some data bytes are within the receive window; 


trim data segment to fit within window; 


if (RST flag set) { 
process depending on state; 
goto drop; 
3 /* Chapter 28 finishes here */ 


if (ACK flag set) { /* Chapter 29 starts here */ 
if (SYN RCVD state) 
simultaneous open complete; 
if (duplicate ACK) 
fast recovery algorithm; 
update RTT estimators if segment timed; 
open congestion window; 
remove ACKed data from send buffer; 
change state if in FIN WAIT 1, CLOSING, or LAST ACK state; 
} 


step6: 
update window information; 


process URG flag; 


dodata: 
process data in segment, add to reassembly queue; 


if (FIN flag is set) 
process depending on state; 


if (SO_DEBUG socket option) 
tcp trace (TA INPUT); 


if (need output || ACK now) 
tcp output (); 
return; 


dropafterack: 
tcp_output() to generate ACK; 
return; 


dropwithreset: 
tcp_respond() to generate RST; 
return; 


drop: 
if (SO_DEBUG socket option) 
tcp trace(TA DROP); 
































































































































































































































































































































































































































return; 
] 
U 28-1 (0) 
0 3 IUU OD dropafterack 
dropwithreset[] drop | | “ drop” g Ol 
dropwithreset RST 
switch LISTEN 
SYN_SENT SYN | trimthenstep6 
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step 6] 
28.2 000 
28-2 TCP 
1. mbu IP[] TCP 
170-204 iphlen IP IP 20 
IP ip stripoptions TCP IP 
IP (9.60 ) TCP (O 28-7) mbuf| 
IP/TCP (40 ) m pullup 40 
mbuf 
tcp_input.c 
170 void P-P 
171 tcp input (m, iphlen) 
172 struct mbuf *m; 
173 int iphlen; 
174 { 
175 struct tcpiphdr “ti; 
176 struct inpcb *inp; 
177 caddr_t optp = NULL; 
178 int optlen; 
179 int len, tlen, off; 
180 struct tcpcb *tp = 0; 
181 int tiflags; 
182 struct socket *so; 
183 int todrop, acked, ourfinisacked, needoutput = 0; 
184 short ostate; 
185 struct in_addr laddr; 
186 int dropsocket = 0; 
187 int iss = 0; 
188 u_long tiwin, ts_val, ts_ecr; 
189 int ts_present = 0; 
190 tcpstat.tcps_rcvtotal++; 
191 /* 
192 * Get IP and TCP header together in first mbuf. 
193 * Note: IP leaves IP header in first mbuf. 
194 */ 
195 ti = mtod(m, struct tcpiphdr +); 
196 if (iphlen > sizeof(struct ip)) 
197 ip stripoptions(m, (struct mbuf *) 0); 
198 if (m->m len < sizeof(struct tcpiphdr)) { 
199 if ((m = m pullup(m, sizeof(struct tcpiphdr))) == 0) ( 
200 tcpstat.tcps rovshort++; 
201 return; 
202 ) 
203 ti = mtod(m, struct tcpiphdr +); 
204 ) š 
tcp_input.c 
0 28-2 tcp input [0000000000 
28-3 TCP 
2: TCP 
205-217 tlen[] TCP IP IP 

































































































































































740 
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TCP/IP 2 
ip_len IP len IP 
TCP 
23-19 
tcp_input.c 
205 /* Wem 
206 * Checksum extended TCP header and data. 
207 */ : 
208 tlen - ((struct ip *) ti)-»ip len; 
209 len = sizeof(struct ip) + tlen; 
210 ti->ti next = ti->ti prev = 0; 
211 ti-»ti xl = 0; 
212 ti-»ti, len = (u short) tlen; 
213 HTONS(ti-»ti len); 
214 if (ti->ti sum = in cksum(m, len)) { 
215 tcpstat.tcps revbadsum++; 
216 goto drop; 
217 } 
218 /* 
219 * Check that TCP offset makes sense, 
220 * pull out TCP options and adjust length. XXX 
221 */ 
222 off = ti->ti_off << 2; 
223 if (off < sizeof(struct tcphdr) || off > tlen) ( 
224 tepstat.tcps_rcvbadoff++; 
225 goto drop; 
226 } 
227 tlen -= off; 
228 ti->ti_len = tlen; ; 
tcp input.c 
U 28-3 tcp input 00000 TCFD D D DI LI UI D l 
3. TCP 
218-228 TCP ti Off 32 bit TCP 
TCP A TCP ) 
TCP 2000) TCP 
TCP tlen ( 0) 
tlen TCP ti_len 
28-4 TCP 
tcp_input.c 
229 if (off > sizeof (struct tcphdr)) I 
230 if (m->m len < sizeof(struct ip) + off) { 
231 if ((m =.m pullupím, sizeof(struct ip) + off)) == 0) { 
232 tcpstat.tcps rovshort++; 
233 return; 
234 ) 
235 ti = mtod(m, struct tcpiphdr *); 
236 } 
237 optlen = off - sizeof(struct tcphdr); 
238 optp = mtod(m, caddr t) + sizeof (struct tcpiphdr); 
239 /* 
240 * Do quick retrieval of timestamp options ("options 


U 28-4 tcp input 00000000 Tero O 
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241 * prediction?"). If timestamp is the only option and it’s 
242 * formatted as recommended in RFC 1323 Appendix A, we 
243 * quickly get the values now and not bother calling 
244 * tep_dooptions(), etc. 
245 */ 
246 if ((optlen == TCPOLEN TSTAMP APPA || 
247 (optlen > TCPOLEN TSTAMP APPA && 
248 Optp[TCPOLEN TSTAMP APPA] == TCPOPT EOL)) && 
249 *(u long *) optp -- htonl(TCPOPT TSTAMP HDR) && 
250 (ti-»ti flags & TH SYN) -- 0) ( 
251 ts present - 1; 
252 ts val = ntohl(*(u long *) (optp + 4)); 
253 ts ecr - ntohl(*(u long *) (optp « 8)); 
254 optp = NULL; /* we've parsed the options */ 
255 ) 
256 ) n 
tcp. input.c 
U 28-4 ([]) 
4. [] IP[] TCP mbuf 
230-236 20 TCP m pullup IP 
TCP TCP mbu 3 80 
(20+20+40) mbu 
m pullup IP 20 TCP 
TCP m_pullup 
28-2 m_pullup tcps_rcvshort 
tcps rcvshort 24-5 
TCP 0 
5. 
237-255 optlen TCP optp 
3 
1) TCP 12(TCPOLEN TSTAMP APPA) TCP 12 
optp[12] 
2) 4 0x0101080a(TCPOPT TSTAMP HDR 26.6 ) 
3) SYN ( 
) 
ts present 1 
ts vall| ts_ecr|| optp 
tcp dooptions 
SYN (MSS ) 
28-5 Internet PCB 
6. 
257-264 (SYN[] FINI] ) tiflags 
TCP 16 bit 32 bit 









































































































































































































































742 rowan u: China"pub.tom 
A pg] 






















































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































16 bit Internet PCB 
- - - tcp_input.c 
257 tiflags = ti->ti flags; 
258 /* 
259 * Convert TCP protocol specific fields to host format. 
260 */ 
261 NTOHL(ti-»ti seg); 
262 NTOHL (ti->ti_ack) ; 
263 NTOHS (ti->ti win); 
264 NTOHS (ti->ti urp); 
265 /* 
266 * Locate pcb for segment. 
267 XZ 
268 findpcb: 
269 inp = tcp last inpcb; 
270 if (inp->inp_lport !- ti->ti_dport || 
271 inp->inp_fport != ti->ti sport |. 
272 inp->inp_faddr.s_addr != ti->ti_src.s_addr || 
273 inp->inp_laddr.s_addr != ti->ti_dst.s_addr) { . 
274 inp = in pcblookup(&tcb, ti-»ti src, ti->ti sport, 
275 ti-»ti dst, ti->ti dport, INPLOOKUP WILDCARD) ; 
276 if (inp) I 
277 tcp last inpcb = inp; 
278 T-tcpstat.tcps pcbcachemiss; 
279 } : 
tcp input.c 
[] 28-5 tcp input 000000000 Internet PCB 
Së Internet PCB 
265-279 TCP (tcp last inpcb) PCB 
UDP TCP PCB 4 
udp input TCP in pcblookup 
PCB 
TCP UDP (wildcard 
entry) 
4 24-5 
80% 
28-6 
tcp input.c 
280 /* iod 
281 * If the state is CLOSED (i.e., TCB does not exist) then 
282 * all data in the incoming segment is discarded. 
283 * If the TCB exists but is in CLOSED state, it is embryonic, 
284 * but should either do a listen or a connect soon. 
285 */ 
286 if (inp == 0) 
287 goto dropwithreset; 
288 tp = intotcpcb(inp); 





U 28-6 tcp input I000000000000 





China-pub.toM mus 743 






































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































289 if (tp == 0) 
290 goto dropwithreset; 
291 if (tp-»t state == TCPS CLOSED) 
292 goto drop; 
293 /* Unscale the window into a 32-bit value. */ 
294 if ((tiflags & TH SYN) -- 0) 
295 tiwin = ti->ti win << tp-»snd scale; 
296 else 
297 tiwin - ti-»ti win; : 
tep input.c 
U 28-6 (1) 
8. RST 
280-287 PCB RST TCP 
SYN RST 
UDP ICMP 
288-290 PCB TCP (tcp. close 
TCP PCB) RST 
9. 
291-292 TCP CLOSED 
connect listen 
bind 
listen SYN 
10. 
293-297 
SYN 
TCP tiwin 16 bit 
32 bit 
28-7 SO DEBUG 





























































































































































































































































































































398 LoL ËCH input.c 


298 SO - inp-»inp socket; 

299 if (so-»so options & (SO DEBUG | SO ACCEPTCONN)) { 
300 if (so-»so options & SO DEBUG) ( 

301 ostate - tp-»t state; 

302 tcp saveti = *ti; 

303 } 

304 if (so->so_options & SO_ACCEPTCONN) { 

305 SO = sonewconn (so, 0); 

306 if (so == 0) 

307 goto drop; 

308 /* 

309 * This is ugly, but .... 

310 * 

311 * Mark socket as temporary until we're 
312 * committed to keeping it. The code at 
313 * 'drop' and 'dropwithreset' check the 


028-7 tcp input J0000000000000000 








744 


314 
315 
316 
317 
318 
319 
320 
321 
322 
323 
324 
325 
326 
327 


328 
329 
330 
331 
332 


333 } 


TCP/IP 


#endif 


} 





China=pubecom 









































* flag dropsocket to see if the temporary 
* socket created here should be discarded. 
* We mark the socket as discardable until 
* we’re committed to it below in TCPS_LISTEN. 


ay 
dropsocket++; 
inp = (struct inpcb +) so->so pcb; 


ti->ti_dst; 
ti->ti_dport; 


inp->inp_laddr 
inp->inp_lport 


#if BSD>=43 


inp->inp_options ip_srcroute(); 


intotcpcb (inp); 
TCPS_LISTEN; 


tp 
tp->t_state 


/* Compute proper scaling value from buffer space */ 
while (tp->request_r_scale < TCP_MAX_WINSHIFT && 
TCP_MAXWIN << tp->request_r_scale < so->so_rcv.sb_hiwat) 
tp->request r scale++; 


IT cp input.c 




















































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































[] 28-7 (0) 
11. IP[] TCP 
300-303 SO DEBUG (ostate)[] IP[] TCP 
(tcp_saveti) tcp trace([] 29-26) 
12. 
304-319 (listen SO. ACCEPTCONN) 
sonewconn PRU_ATTACH ([] 30-2) Internet PCB[] TCP 
TCP ( 
SYN) dropsocket “ drop” 
" dropwithreset" 
320-326 inp[] tp TCP 
TCP 
ip_srcroute mbuf inp_options 
TCP tcp_output ip_output 
327 LISTEN SYN 28-16 
13. 
328-331 
(655351) TCP_MAXWIN) 65535 
(14[] TCP MAX WINSHIFT) 
listen SO RCVBUF 
tcp recvspace 
14 65535x 2" 1 073 725 440 
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(Net/3 2626 144) 14 
28.1[] 28.2 
28-8 TCP 

tcp_input.c 

334 /* cpmp 

335 * Segment received on connection. 

336 * Reset idle time and keepalive timer. 

337 */ 

338 tp->t idle = 0; 

339 tp->t timer [TCPT KEEP] = tcp keepidle; 

340 /* 

341 * Process options if not in LISTEN state, 

342 * else do it below (after getting remote address). 

343 e 

344 if (optp && tp->t state != TCPS LISTEN) 

345 tcp dooptions(tp, optp, opt len, ti, 

346 &ts present, &ts val, &ts ecr); , 
tcp input.c 

0 28-8 tcp incu t(][] Lu 0 0 0. B. 0 D LI 1.9 0 BB HBD BBB DD DB 
14. 
334-339 t idle 0 2 
15. TCP 
340-346 TCP LISTEN tcp_dooptions 
RFC 1323 A 28-4 optp 
TCP PCB tcp_dooptions 
MSS 28-17 

























































































































































































28.3 tcp_dooptions]|] |] 
























































Net/3 5[] TCP (U 26-4)[] EOL[] NOP[] MSS 

















































































































28-9 
































———————— —— "————————— . 
1213 void tcp input.c 


1214 tcp dooptions(tp, cp, cnt, ti, ts present, ts val, ts ecr) 
1215 struct tcpcb *tp; 
1216 u char *cp; 


1217 int ent; 
1218 struct tcpiphdr *ti; 
1219 int *ts_present; 
1220 u long *ts val, *ts_ecr; 
1221 ( 
1222 u short mss; 
1223 int opt, optlen; 
1224 for (; ent > 0; ent -= optlen, cp += optlen) { 
1225 opt = cp[0]; 
1226 if (opt == TCPOPT_EOL) 


[] 28-9 tcp dooptions 00000 EOLO NOPD O 


746 
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TCP/IP 2 
1227 break; 7 
1228 if (opt == TCPOPT_NOP) 
1229 optlen = 1; 
1230 else { 
1231 optlen = cp[1]; 
1232 if (optlen <= 0) 
1233 break; 
1234 } 
1235 switch (opt) { 
1236 default: 
1237 continue; 
— —————— tp input.c 
O 28-9 (0) 
1. 
1213-1229 TCP EOL( ) 
NOP 1 (U) 26-16) switch 
default 
1230-1234 optlen|| 
Net/3 TCP 
1) (NOP[] EOL 
) for optlen 
2) switch default U U 
28-10 tcp_dooptions MSS uu 
2. MSS 
1238-1246 A(TCPOLEN. MAXSEG) SYN 
MSS tcp mss 
tcp mss TCP t maxseg 
3, 
1247-1254 A(TCPOLEN WINDOW) SYN 
Net/3 TF RCVD SCALE U 
requested_s_scale cp[2] 
ESTABLISHED 
4. | 
1255-1273 10(TCPOLEN TIMESTAMP) 
ts present 1 ts vall| ts ecr 
SYN Net/3 TF RCVD TSTMP 
ts recent ts recent age tcp now 
500ms 
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U 28-10 tcp_dooptions UUDUDUDUMasnUDHUDUUDUDUUD 











































































































































































































































































































































































































28.4 [|] ÜU Ú 
28-8 tcp_input 
Van Jacobson 4.3BSD Reno 
[Jacobson 1990b] 3 
1) TCP ACK 
2) TCP 
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TCP/IP 2 
[Partridge 1993] Van Jacobson TCP 
28-11 
tcp_input.c 
347 pe Ta 
348 * Header prediction: check for the two common cases 
349 * of a uni-directional data xfer. If the packet has 
350 * no control flags, is in-sequence, the window didn’t 
351 * change and we're not retransmitting, it’sa 
352 * candidate. If the length is zero and the ack moved 
353 * forward, we're the sender side of the xfer. Just 
354 * free the data acked & wake any higher-level process 
355 * that was blocked waiting for space. If the length 
356 * is non-zero and the ack didn't move, we’re the 
357 * receiver side. If we're getting packets in order 
358 * (the reassembly queue is empty), add the data to 
359 * the socket buffer and note that we need a delayed ack. 
360 */ 
361 if (tp->t state == TCPS_ESTABLISHED && 
362 (tiflags & (TH SYN | TH FIN | TH_RST | TH URG | TH ACK)) == TH_ACK && 
363 (!ts present || TSTMP GEQ(ts val, tp-»ts recent)) && 
364 ti-»ti seq -- tp-»rcv nxt && 
365 tiwin kk tiwin == tp->snd wnd && 
366 tp->snd_nxt == tp-»snd max) { 
367 SCH 
368 * If last ACK falls within this segment’s sequence numbers, 
369 * record the timestamp. 
370 */ 
371 if (ts present && SEQ LEQ(ti->ti seq, tp->lastack sent) && 
372 SEQ LT(tp->last ack sent, ti->ti_seq + ti->ti len)) ( 
373 tp->ts recent age = tcp now; 
374 tp->ts recent = ts val; 
375 ) » 
tcp input.c 
[] 28-11 tcp input [00000000000 
1. 
347-366 6 
ACK 
1) ESTABLISHED 
2) 4 SYNI FIN[] RST URG ACK 
TCP[] 6 ACK 4 PSH 
( ESTABLISHED RST ACK 
) 
3) (ts_val) 
(ts_recent) PAWS 28.7 PAWS 
ts_val ts_recent 
(Net/3 tcp_now) 
Net/3 500 ms 





































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































(tep_nowW)| D B D B. UI D LU LU U U U U U U U U 0) u LU LU U U U U LU 
O Wl 64 bit 32 bit Uu 32 bit] EL EL E] E] uuu 64 
bit] [] LL D D] HL 1 ODO 
400000000 (ti seg) U U U U U UU (rev. nxt)[ O O 
LU U U LU U U U 0 ui i 
50000 OO (tiwin) 00000 (snd_wnd) 
6) (snd nxt) 000000 OO (sna ma) 0000000 
2. OM ts recent 
367-375 DOO0O000000000000 26-180 000 O 
O O (ts val) ts_recent ts_recent_age (tcp_now) 
26-18 UD | 26-20 
OOOOOOOOOOODOOOOODOOD DO U 00 26-200 O TstMP GEO [] 
L UT TT T T) 28-00 JOU OU it 0 | u L 
U 28-121] [ | uu uu LU U U U U U U 00 0 LU LU U U U 
ACKT 
tcp_input.c 
376 if (ti->ti_len == 0) { 
377 if (SEQ GT(ti-»ti ack, tp->snd una) && 
378 SEQ.LEQ(ti->ti_ack, tp->snd max) && 
379 tp->snd_cwnd >= tp-»snd wnd) { 
380 /* 
381 * this is a pure ack for outstanding data. 
382 */ 
383 ++tcpstat.tcps predack; 
384 if (ts present) 
385 tcp_xmit_timer(tp, tcp now - ts ecr + 1); 
386 else if (tp-»t rtt && 
387 SEQ GT(ti-»ti ack, tp-»t rtseq)) 
388 tcp xmit timer(tp, tp-»t, rtt); 
389 acked = ti->ti_ack - tp-»snd una; 
390 tcpstat.tcps rcvackpack-*; 
391 tcpstat.tcps rcvackbyte += acked; 
392 sbdrop(&so-»so snd, acked); 
393 tp->snd una = ti-»ti ack; 
394 m freem(m); 
395 /* 
396 * If all outstanding data is acked, stop 
397 * retransmit timer, otherwise restart timer 
398 * using current (possibly backed-off) value. 
399 * If process is waiting for space, 
400 * wakeup/selwakeup/signal. If data 
401 * is ready to send, let tcp output 
402 * decide between more output or persist. 
403 e El 
404 if (tp-»snd una == tp-»snd max) 
405 tp->t timer[TCPT REXMT] = 0; 


[]28-12 tcp imw JO000000000000 


750 
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TCP/IP 2 
406 else if (tp->t_timer[TCPT_PERSIST] == 0) 
407 tp->t_timer[TCPT_REXMT] = tp->t_rxtcur; 
408 if (so->so_snd.sb_flags & SB_NOTIFY) 
409 sowwakeup (so) ; 
410 if (so->so_snd.sb_cc) 
411 (void) tcp_output (tp); 
412 return; 
xia : tcp. input.c 
O 28-12 ([]) 
3.[] ACK 
376-379 4 ACK 
1) (ti_len 0) 
2) (ti_ack) (snd_una) = 
"Ll ” | ACK | | 
3) (ti ack) (snd maz) 
4) (snd wnd) 
4. RTT 
384-388 L L L L L L 
tcp_xmit_timer RTTU U 
5: 
389-394 acked sbdrop 
(snd una) 
mbuf| ( 0 mbuf) 
6. 
395-407 (snd una snd max) 
t rxtcur 
tcp output BE 
U U U U | 
U U 
7. 
408-409 sowwakeup 
16-5 0 | | select |] 
O SIGIO[] [] SB. NOTIFY U 
8. 
410-411 tcp_output 
snd_una snd_wnd 24-17 
28-13 
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414-416 4 
D (ti_1eN0 9 0 28-12 if else 
2) (ti_ack) 
3) (seq_next tp) 
4) 
10. 
423-435 (rcv_nxt) mbu IP TCP 
TCP mbu sorwakeup 
TCP_REASS 
ACK 
- i a tcp_input.c 
414 } else if (ti->ti_ack == tp->snd una && 
415 tp->seg_next == (struct tcpiphdr *) tp && 
416 ti->ti_len <= sbspace (&so->so_rcv)) { 
417 /* 
418 * this is a pure, in-sequence data packet 
419 * with nothing on the reassembly queue and 
,420 * we have enough buffer space to take it. 
421 */ 
422 ++tcpstat.tcps_preddat; 
423 tp->rcv_nxt += ti->ti len; 
424 tcpstat.tcps rcvpack++; 
425 tcpstat.tcps rcvbyte += ti->ti len; 
426 ZS 
427 * Drop TCP, IP headers and TCP options then add data 
428 * to socket buffer. 
429 */ 
430 m-»m data += sizeof (struct tcpiphdr) + off - sizeof (struct tcphdr); 
431 m-»m len -= sizeof (struct tcpiphdr) + off - sizeof(struct tcphdr); 
432 sbappend (£so->so_rcv, m); - 
433 sorwakeup (so); 
434 tp->t flags |= TF DELACK; 
435 return; 
436 ) 
437 } i 
tcp_input.c 
D 28-13 tcp inam J000000000000 
LAN(bdsi 
svr4 ) WAN(vangogh.cs.berkeley.edu 
ftp.uu.net ) netstat 24-5 
LAN ACK 
97% -100% WAN 8370-9990 
TCP PCB 





























































































































































































































75 2 TCP/IP 2 
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28.5 TCPD D D D 0 0 00 0 U 











































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































tcp input 28-14 
tcp_input.c 
438 /* Br 
439 * Drop TCP, IP headers and TCP options. 
440 */ 
441 m-»m data += sizeof (struct tcpiphdr) + off - sizeof(struct tcphdr) ; 
442 m->m len -= sizeof (struct tcpiphdr) + off - sizeof (struct tcphdr); 
443 FE 
444 * Calculate amount of space in receive window, 
445 * and then do TCP input processing. 
446 * Receive window is amount of space in rcv queue, 
447 £ but not less than advertised window. 
448 */ 
449 { 
450 int win; 
451 win = sbspace (&so->so_rcv); 
452 if (win < 0) 
453 win = 0; 
454 tp->rev wnd = max(win, (int) (tp->rcv adv - tp->rcv_nxt)); 
455 } : 
tcp input.c 
[] 28-14 tcp input 00000 IPO TCP] DQ 
1. IP[] TCP TCP 
438-442 mbu mbu IP TCP 
TCP off TCP TCP TCP 
(20 ) 
2. 
443-455 win rcv adv rcv nxt 
win TCP win 


















































































































































































































































































































































































































































































































































28.6 U UU UU 00000 U 











LISTEN SYN SENT 
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28.6.1 
LISTEN 28-15 tpl inp 28-7 
- tcp input.c 
456 switch (tp->t state) ( 
457 /* 
458 * If the state is LISTEN then ignore segment if it contains an RST. 
459 * If the segment contains an ACK then it is bad and send an RST. 
460 * If it does not contain a SYN then it is not interesting; drop it. 
461 * Don't bother responding if the destination was a broadcast. 
462 * Otherwise initialize tp-»rcv nxt, and tp-»irs, select an initial 
463 * tp-»iss, and send a segment: 
464 ba <SEQ=ISS><ACK=RCV_NXT><CTL=SYN, ACK> 
465 * Also initialize tp->snd nxt to tp->iss+l and tp->snd una to tp->iss 
466 * Fill in remote peer address fields if not previously specified. 
467 * Enter SYN_RECEIVED state, and process any other fields of this 
468 * segment in this state. 
469 *7 
470 case TCPS LISTEN: { 
471 struct mbuf *am; 
472 struct sockaddr in “sin; 
473 if (tiflags & TH,RST) 
474 goto drop; 
475 if (tiflags & TH ACK) 
476 goto dropwithreset; 
477 if ((tiflags & TH SYN) -- O0) 
478 goto drop; : 
tcp input.c 
0 28-15 teo input OOOOOOO000000000 SYN 
1. RST[] ACK SYN 
473-478 RST ACK 
RST ( SYN ACK ) 
SYN case LISTEN SYN 
SYN_RCVD 
28-16 case 
479 /* tcp input.c 
480 * RFC1122 4.2.3.10, p. 104: discard bcast/mcast SYN 
481 * in broadcast() should never return true on a received 
482 * packet with M BCAST not set. 
483 */ 
484 if (m-»m flags & (M BCAST | M MCAST) || 
485 IN MULTICAST(ti->ti der. a | addr)) 
486 goto drop; 
487 am = m get (M DONTWAIT, MT SONAME); /* XXX */ 
488 if (am -- NULL) 
489 goto drop; 
490 am->m len = sizeof(struct sockaddr in); 


0 28-16 tcp input J000000000000 SYND DD 












































754 TCP/IP 2 China-pub.tom 
— en SS 
























































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































491 sin = mtod(am, struct sockaddr_in *); 
492 sin->sin_family = AF_INET; 
493 sin->sin_len = sizeof(*sin); 
494 sin->sin_addr = ti->ti_src; 
495 sin->sin_port = ti->ti_sport; 
496 bzero((caddr t) sin->sin zero, sizeof(sin-»sin zero)); 
497 laddr = inp->inp laddr; 
498 if (inp->inp laddr.s addr == INADDR ANY) 
499 inp->inp laddr = ti->ti_dst; 
500 if (in_pcbconnect (inp, am)) { 
501 inp->inp_laddr = laddr; 
502 (void) m_free (am); 
503 goto drop; 
504 } 
505 (void) m_free (am); å 
tcp input.c 
H 28-16 ([]) 
2. 
479-486 TCP 
ether_input M_BCAST|| M MCAST 
IN MULTICAST IP D 
in broadcast Net/l ( ) 
IP Net/2 
ether_input M_BCAST|| M_MCAST 
Net/3 in broadcast 
IP IP 
in broadcast Net/3 
IP 28- 
16 
IN_MULTICAST 
3. IP mbuf 
487-496 mbu sockaddr_in IP 
IP IP TCP 
PCB mbu 
“ XXX” mbu in_pcbconnect 
tcp_input 24-5 
%2 
4. PCB 
497-499 laddr ( 
IP PCB 
IP 
laddr 28-7 IP 
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5. PCB 
500-505 in_pcbconnect PCB PCB 
mbu 
28-17 case 
tcp input.c 
506 tp->t template = tcp_template(tp); 
507 if (tp->t template == 0) { 
508 tp = tcp_drop(tp, ENOBUFS); 
509 dropsocket = 0; /* socket is already gone */ 
510 goto drop; 
511 } 
512 if (optp) 
513 tcp_dooptions(tp, optp, optlen, ti, 
514 &ts_present, &ts_val, &ts_ecr); 
515 if (iss) 
516 tp->iss = iss; 
517 else 
518 tp->iss = tcp_iss; 
519 tcp iss += TCP ISSINCR / 2; 
520 tp-»irs = ti-»ti seq; 
521 tcp sendseqinit (tp); 
522 tcp rcvseginit (tp); 
523 tp->t flags |= TF ACKNOW; 
524 tp->t state = TCPS SYN RECEIVED; 
525 tp->t, timer [TCPT KEEP] = TCPTV KEEP INIT; 
526 dropsocket - 0; /* committed to socket */ 
527 tcpstat.tcps_accepts++; 
528 goto trimthenstep6; 
529 } : 
tcp input.c 
U 28-17 tcp input [0000 LISTEN] 0.0 0 0 SYNU D 0 D 0 D 
6. IP[] TCP 
506-511 tcp template IP[] TCP 28-7 Sonewconn 
PCB[] TCP 
7. TCP 
512-514 TCP tcp_dooptions 28-8 
tcp_dooptions LISTEN TCP PCB 
(tcp_mss ) tcp_dooptions 
(0 0 MSS ID 
ID) 
8. ISS 
515-5139 tcp iss 64 000 
(TCP. ISSINCR 2) iss iss tcp iss 





































































































































































































iss 


. IP 128.1.2.3 27 
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192.3.4.5 









































3000 























(128.1.2.3, 27, 1 


























TIME_WAIT 






































TCP 




















100 000 




























































































TIME_WAIT 





























































































































SYN[] TCP 














TIME 


| (192.3.4.5, 














WAIT 




















PCB 
































PCB 


SYN 















































200 000 
















































































LISTEN 














































































































28-28 






























































SYN 



































(200 000) 
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(2) 











TIME WAIT 












































(100 000) 















































TCP ) 





















































findpcb( 


28-5) 

















PCB( 
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228 000) 



































tcp 


















































































































































































































































connectl|] 


























iss 

















64 000( 





30-4) 
































































































































500 ms 

























































































tcp iss) 













































































ISS 



























































520-522 






































28-17 
































SYN 

























































































(irs) 


























TCP 



















































































#define tcp_rcvseqinit (tp) N 


(tp) ->rcv_adv = 


(tp) ->rcv_nxt = 


#define tcp sendseqinit(tp) \ 


(tp) ->snd_una = (tp)->snd_nxt = (tp)->snd_max = 


(tp) ->iss 





(tp) ->irs + 1 





SYN 











































































































10 








10. 














SYN 








523-525 

















SYN 































































































SYN RCVD 



































[ [ 








750 






































tcp output 








ACK 


























TF ACKNOW 


(tp) ->snd_up = \ 

































































(TCPTV_KEEP_INIT) 











TF_ACKNOW 





























24-16 






































tcp_outflags 







































































SYN 








526-528 











TCP 


























28-7 



































drop 
































trimthenstep6 
































SYN 


















































SYN 
































































































































28.6.2 


























28-18 


















































ESTABLISHED 




















































































































| SYN_SENT 
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tcp_input.c 
530 /* cp_mp 
531 * If the state is SYN SENT: 
532 * if seg contains an ACK, but not for our SYN, drop the input. 
533 * if seg contains an RST, then drop the connection. 
534 * if seg does not contain SYN, then drop it. 
535 * Otherwise this is an acceptable SYN segment 
536 * initialize tp->rcv_nxt and tp->irs 
537 * if seg contains ack then advance tp->snd_una 
538 * if SYN has been acked change to ESTABLISHED else SYN_RCVD state 
539 * arrange for segment to be acked (eventually) 
540 * continue processing rest of data/controls, beginning with URG 
541 Zë 
542 case TCPS SYN SENT: 
543 if ((tiflags & TH ACEN Eë 
544 (SEQ LEQ(ti->ti ack, tp->iss) || 
545 SEQ GT(ti-»-ti ack, tp->snd max))) 
546 goto dropwithreset; 
547 if (tiflags & TH RST) ( 
548 if (tiflags & TH ACK) 
549 tp - tcp drop(tp, ECONNREFUSED); 
550 goto drop; 
551 } 
552 if ((tiflags & TH SYN) == 0) 
553 goto drop; : 
tcp input.c 
U 28-18 tcp input D JD TJ D DI 0 SYN D U U U B D B 
1. ACK 
530-546 TCP SYN 
; SYN 366 367 
30-4 iss tcp iss 
tcp sendseginit( ) Å A 
ISS 365 28-19 tcp output SYN 
snd una = 365  snd nxt = 366 
snd up 2365 snd maz = 366 
tcp sendseqinit 28-19 4 
im 2 0 28-19 ISSO 0 3650 SYND D D 
365 26-31 SYN 0000000 
366 28-18 
ACK iss(365) snd max(366)[] ACK 
RST SYN SENT ACK 
SYN (simultaneous open)([] 24-15) 
2 RST 
547=551 RST ACK 
ACK( MM RST 
tcp drop so error connect 
3. SYN 
552-533 SYN 
case SYN 



































































































































































































































( ACK) 28-20 tcp_input SYN 

























































































758 
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TCP/IP 2 
i - tcp input.c 
554 if (tiflags & TH ACK) { 
555 tp->snd una = ti->ti ack; 
556 if (SEQ LT(tp->snd nxt, tp->snd una)) 
557 tp->snd nxt = tp->snd una; 
558 } i 
559 tp->t_timer [TCPT_REXMT] = 0; 
560 tp->irs = ti->ti_seg; 
561 tcp rovseginit (tp); 
562 tp->t flags |= TF ACKNOW; 
563 if (tiflags & TH ACK && SEQ GT(tp-»snd una, tp->iss)) ( 
564 tcpstat.tcps_connects++; 
565 soisconnected (so); 
566 tp->t_state = TCPS_ESTABLISHED; 
567 /* Do window scaling on this connection? */ 
568 if ((tp->t flags & (TF_RCVD_SCALE | TF_REO_SCALE)) == 
569 (TF RCVD SCALE | TF REQ SCALE)) { 
570 tp->snd scale = tp->reguested s scale; 
571 tp->rcv scale = tp->request r scale; 
572 } 
573 (void) tcp reass(tp, (struct tcpiphdr *) 0, 
574 (struct mbuf *) 0); 
575 /* 
576 * if we didn't have to retransmit the SYN, 
577 * use its rtt as our initial srtt & rtt var. 
578 SÉ 
579 if (tp->t rtt) 
580 tcp xmit timer(tp, tp-»t rtt); 
581 ) else 
582 tp->t state = TCPS SYN RECEIVED; I 
tcp input.c 
D 28-20 tcp input OO DLL CL 0000000000000 SYN 
4. ACK 
554-558 ACK snd_una 28-19 
snd_una 366 366 snd_nxt 
snd una( 28-19 ) snd nxt snd una 
5. 
559 
ACK 
ACK[] SYN SY 
6. 
560-562 tcp. rcvseqinit[]( 
rcv adv[| rcv. nxt 1 TF ACKNOW 
tcp output rcv nxt([] 26-27) 
SYN 
563—564 ACK snd una ISS 
ESTABLISHED 
28-20 ACK snd_una 
28-18 case if 
ISS ACK| snd una ISS 
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7. 
565-566 soisconnected TCP 
ESTABLISHED 
8. 
567-572 TCP SYN SYN 
snd_scale[] rcv. scale tcp_newtcpcb TCP 
0 0 
9. 
573-574 tcp_reass 
TCP ACK[] SYN 
SYN SENT ESTABLISHED SYN 
dodata TCP ACK 
SYN( ) ACK 
SYN_RCVD ESTABLISHED 
SYN Net/3 Net/3 
10. RTT 
575-580 SYN tcp_xmit_timer SYN 
RTT 
TCP t_rtt TCP 
SYN (U 26-24) | L| | 
SYN ( 28-10[] Net/3[] SYN ) 
TCP t_rtt 
(500ms) t_rtt 
RTT 
( ) 
11. 
581-582 TCP[] SYN SENT ACK[] SYN 
SYN RCVD 
28-21 SYN 28-17 
trimthenstep6 
583 trimthenstep6: tcp input.c 
584 za 
585 * Advance ti->ti seq to correspond to first data byte. 
586 * If data, trim to stay within window, 
587 * dropping FIN if necessary. 
588 */ 


O 28-21 tcp input O 0000 SYND D 0 0 U 


760 








TCP/IP 2 
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589 ti->ti_seq++; 
590 if (ti->ti_len > tp->rcv_wnd) { 
591 todrop = ti->ti_len - tp->rcv_wnd; 
592 m_adj (m, -todrop); 
593 ti->ti_len tp-»rcv. wnd; 
594 tiflags &= "TH FIN; 
595 tcpstat.tcps rovpackafterwin++; 
596 tcpstat.tcps rcvbyteafterwin += todrop; 
597 } 
598 tp->snd wll = ti->ti seg - 1; 
599 tp-»rcv up = ti->ti seq; 
600 goto step6; 
601 } < 
tcp input.c 
I 28-21 (0) 
584-589 1 SYN SYN ti_seq 
12. 
590-597 ti_len 
(ti_len rcv_wnd) m_adj mbuf 
( 2-20) ti len mbuf FIN 
FIN 
SYN 
SYN 
SYN 
SYN 
13. 
598-599 snd wll 1 29-15 3 
snd_wnd[] snd_w11[] snd w12 (rcv. up) 
step6 RFC 793 29-15 
28.7 PAWS LH UU ttl 
28-22 tcp input RFC 1323 
PAWS 26.6 
tcp input.c 
602 /* FAT 
603 * States other than LISTEN or SYN SENT. 
604 * First check timestamp, if present. 
605 * Then check that at least some bytes of segment are within 
606 * receive window. If segment begins before rcv nxt, 
607 * drop leading data (and SYN); if nothing left, just ack. 
608 * i 
609 * RFC 1323 PAWS: If we have a timestamp reply on this segment 
610 * and it’s less than ts_recent, drop it. i 
611 */ 
612 if (ts present && (tiflags & TH_RST) == 0 && tp->ts_recent && 


O 28-22 tcp input D 0 0 0 0 0 0 00 L 
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613 TSTMP LT(ts val, tp-»ts recent)) { 
614 /* Check to see if ts recent is over'24 days old. */ 
615 if ((int) (tcp now - tp->ts recent age) > TCP PAWS IDLE) { 
616 /* 
617 * Invalidate ts recent. If this segment updates 
618 * ts recent, the age will be reset later and ts recent 
619 * will get a valid value. If it does not, setting 
620 * ts recent to zero will at least satisfy the 
621 * requirement that zero be placed in the timestamp 
622 * echo reply when ts recent isn't valid. The 
623 * age isn't reset until we get a valid ts recent 
624 * because we don't want out-of-order segments to be 
625 * dropped when ts recent is old. 
626 */ 
627 tp->ts recent = 0; 
628 ) else { ` 
629 tcpstat.tcps_rcvduppack++; 
630 tcpstat.tcps_rcvdupbyte += ti->ti len; 
631 tcpstat.tcps_pawsdrop++; 
632 goto dropafterack; 
633 } 
634 } i 
tcp input.c 
U 28-22 (0) 
de PAWS 
602-613 tcp_dooptions ts_present 3 
1) RST ( 28.8) 
2) TCP (ts recent ) 
3) (ts_val) 
PAWS 32 bit 32 bit 
28.6 ( 1) 
24 17 (U 1[] 24.3 ) 
( ) tcp input 
PAWS 
PAWS ACK[] PAWS 
PAWS ([] 28-11) 
2. 
614-627 PAWS 
ts recent ts recent age 
(tcp. now) ts recent 24 
TCP_PAWS_IDLE (24 X 24x 60x 60x 2) 2 2 






















































































































































































































































































































































































762 «wi ú China-pubıcoM 
————————— 























































































































































































































































































































28.6[] 28.7 
28-23 | Net/3[] TCP RFC 
13231 [| | O Net/3 | 
00051 Ee p reus =ts_val=1 
e a SEE ts_recent_age = tcp_now=N 


000025] = 
: 4 320 000 [| 0 
O O O 2 2 147 483 649 00000000 
nnn = 2 147 483 650 , 
U D D D D =2 160 000 001 ts_val = 2 160 000 001 


O O D =2 160 000 001 «ts recent =1 


tcp. now = N + 4 320 000 





















































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































0823 000090900 
1 ts_recent 1[] ts recent age 
(tcp. now) 28-11 28-35 0 ODO 250 tcp now 
4 320 000 (25 X 24x 60x 60x 1000) 2 160 000 000 (25 x 24x 60x 60x 
1000) 2 147 483 649 1 2 147 483 650 1( 24-26) 
2 160 000 001 TSTMP LT 
ts recent(l)[] PAWS tcp now ts recent age 
24 
3. 
628-633 PAWS ( 
) 
24-5 tcp pawsdrop (22) tcps_rcvduppack (46 953) 
TCP 
PAWS 
288 000000000000 
28-24 
1. O 0 
635-636 |] (ti seg JD | (rcv. nxt)[] J 
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todropl] UO | | | | | | | | L (0 24-18)[] 
635 todrop = tp->rcv_nxt - ti->ti seg; tep MGE 
636 if (todrop > 0) ( 

637 if (tiflags & TH SYN) { 

638 tiflags &- "TH SYN; 
639 ti->ti_seq++; 

640 if (ti->ti_urp > 1) 

641 ti->ti urp--; 

642 else 

643 tiflags &= “TH URG; 
644 todrop--; 

645 ) 


Te. ep input.c 
























































































































































































































































































































































































































































































































































































































































U 28-24 tcp input D T D D D B Dl LI U D D 00000 
2.0 SYN 
637-645 [][] SYN uu 0 | OM | U U 0 
SYN[] | ID LH D I SYN o [] [] [] 
001(ti_urp U ulti | LU 
0 1 0 1 URG todrop 
10 U SYN ) 
28-25 | Hutt 
- - - tcp input.c 

646 if (todrop »- ti-»ti len) ( 

647 tcpstat.tcps revduppack++; 

648 tcpstat.tcps rcvdupbyte += ti-»ti len; 

649 /* 

650 * If segment is just one to the left of the window, 

651 * check two special cases: i 

652 * 1. Don't toss RST in response to 4.2-style keepalive. 

653 * 2. If the only thing to drop is a FIN, we can drop 

654 * it, but check the ACK or we will get into FIN 

655 * wars if our FINs crossed (both CLOSING). 

656 * In either case, send ACK to resynchronize, 

657 * but keep on processing for RST or ACK. 

658 */ 

659 if ((tiflags & TH FIN && todrop == ti->ti_len + 1) 

660 ) I 

661 todrop = ti->ti len; 

662 tiflags &- “TH FIN; 

663 tp->t flags |= TF ACKNOW; 

664 ) else { 

665 /* 

666 * Handle the case when a bound socket connects 

667 * to itself. Allow packets with a SYN and 

668 * an ACK to continue with the processing. 

669 */ 

670 if (todrop != 0 || (tiflags & TH ACK) == 0) 

671 goto dropafterack; Ë 

672 } 

673 } else { 

674 tcpstat.tcps_rcvpartduppack++; 

675 tcpstat.tcps rcvpartdupbyte += todrop; 


U 28-25 tcp input UU DU 000 0 0 0 0 0 U 









































764 TCP/IP 02 China-bubıcom 
aa 














































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































676 ) 
677 m adj (m, todrop); 
678 ti->ti seg += todrop; 
679 ti->ti len -= todrop; 
680 if (ti->ti_urp > todrop) 
681 ti->ti urp -= todrop; 
682 else ( a 
683 tiflags &- "TH URG; 
684 ti-»ti urp - 0; 
685 3 
686 } : 
tcp input.c 
[ 28-25 ([]) 
3 i 
646-648 | 0 U 0 
| 
4. FIN 
649-663 FIN 28-26 
1 2 3 4 5 6 7 8 9 FIN 
TEOOOOOOOOOOOOONOO 
00000/ ti _len=4FN:0000 rev nxt = 11 
N U D DDD D 
ti_seq=6 
U 2826 O DIO D BO] FIND] BL OL BO DE U D 
28-26[] todrop |] 5 O 0 ti_len(4) FIN todrop 
ti len[] I O [] FIN todrop [] 4 TF ACKNOW 
ACK ti seq ti len 10 
4.2BSD Net/3 OT! 
O) 
5. ACK 
664-672 todrop ( U U U T] U LH) O ACK 0 0 
dropafterack[] [| ACK[] [] MHU qI ACK] 
TCP | ACK 
6. 
664-672 | | | 
todrop 0( ) ACK 
i£l] O [| 4.4BSD | Berkeley 
dropafterack | | | 
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I 
673-676 todrop else 
8. 
677-685 m_adj mbu 
mbuf 
URG 
28-27 
tcp_input.c 
687 /* TER 
688 * If new data is received on a connection after the 
689 * user processes are gone, then RST the other end. 
690 */ 
691 if ((so->so_state & SS NOFDREF) && 
692 tp->t state > TCPS_CLOSE_WAIT && ti->ti Jen) { 
693 tp = tcp_close(tp); 
694 tcpstat.tcps_rcvafterclose++; 
695 goto dropwithreset; 
696 } . 
tcp. input.c 
[] 28-27 tcp input I0000000000000000 
687-696 ( 24-16 
CLOSE WATT 5 ) 
RST 
TCP ( ) 
TCP FIN FIN WAIT 1 
FIN 
28-27 FIN 
28-28 
tcp_input.c 
697 /* ED 
698 * If segment ends after window, drop trailing data 
699 * (and PUSH and FIN); if nothing left, just ACK. 
700 */ 
701 todrop = (ti->ti seq + ti->ti len) - (tp->rcv_nxt + tp->rcv_wnd); 
702 if (todrop > 0) í 
703 tcpstat.tcps_rcvpackafterwin++; 
704 if (todrop >= ti->ti_len) { 
705 tcpstat.tcps rcvbyteafterwin += ti->ti len; 
706 /* 
707 * If a new connection request is received 
708 * while in TIME WAIT, drop the old connection 
709 * and start over if the sequence numbers 
710 * are above the previous ones. 
711 SI 
712 if (tiflags & TH SYN && 
713 tp->t state == TCPS TIME WAIT && 


0 28-28 tcp input )0000000000000 


766 





TCP/IP 2 
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714 SEQ_GT(ti->ti_seq, tp-»rcv nxt)) ( 
715 iss - tp-»rcv nxt 4 TCP ISSINCR; 
716 tp - tcp close(tp); 
717 goto findpcb; 
718 H 
719 FE 
720 * If window is closed can only take segments at 
721 * window edge, and have to drop data and PUSH from 
722 * incoming segments. Continue processing, but 
723 * remember to ack. Otherwise, drop segment 
724 * and ack. 
725 */ 
726 if (tp->rev_wnd == 0 && ti->ti seq == tp-»rcv nxt) { 
727 tp->t_flags |= TF_ACKNOW; 
728 tcpstat.tcps_rcvwinprobe++; 
729 } else 
730 goto dropafterack; 
731 } else 
732 tcpstat.tcps rcvbyteafterwin += todrop; 
733 m_adj (m, -todrop); 
734 ti->ti_len -= todrop; 
735 tiflags &= “(TH PUSH | TH FIN); 
736 ; 
tep input.c 
H 28-28 (O) 
9. 
697-703 todrop 28-29 
todrop (6+5) (4+6) 1 
"rcv wndz6: 0000 
HUDHDUUD 
1 2 3 10 11 .. 
00000000 4 
rev nxt =4 x rcv. adv = 10 
"os ti lenz5 
(0000 6 7 8 9 
ti seq=6 
0 2829 [00000000000000000 
10. TIME WAIT 
704-718 todrop 3 
1) SYN 
2) TIME WAIT 
3) 
TIME WAIT RFC 1122 
ISS (rev nxt)[] TCP[] rcv. nxt 
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128 000(TCP. ISSINCR)[] [] 28-17 UDE ISS| tcp. close) |] 
TIME WAIT PCB[] TCP 0 findpcb([] 28-5) 
000000 PCB( JG | 0 28-70 00 uuu 
28-16[] [] 28-17 g 
11. 
719-728 (rcv_wnd| 0) E 
(rcv. nxt) TCP ACK 
U 
12. LU U U U U U 
729=730 10000 U 000000000000 U U U 
| | ACK 
13. U 
731-735 m_adj mbu | ti len 
m adj mbuf ti len 
OM] FIND PSH 
I ACK 
28-25 U) | | UU U 
dropafterack[Carlson 1993; Lanciani 1993] 0 0 
g 0 | 0 ACK 
28-25 dropafterack 
u FIN] | | ACK| O 28-25] [| 646-676 
28-30 | ( 28.9) 
if (todrop > ti->ti_len || 
todrop == ti->ti_len && (tiflags & TH_FIN) == 0) { 
/* 


* Any valid FIN must be to the left of the window. 
* At this point the FIN must be a duplicate or 

* out of sequence; drop it. 

*/ 

tiflags &= "TH FIN; 


/* 
* Send an ACK to resynchronize and drop any data. 
* But keep on processing for RST or ACK. 
*/ 
tp->t flags |= TF_ACKNOW; 
todrop = ti->ti len; 
tcpstat.tcps_rcvdupbyte += todrop; 
tcpstat.tcps_rcvduppack++; 


} else { 
tcpstat.tcps_rcvpartduppack++; 
tcpstat.tcps_rcvpartdupbyte += todrop; 


U 28-30 [| 28-28] 646-676[] 00000 






































768 TCP/PQU (2 China-bubıcom 
— a 


289 00000000 








































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































4.4BSD 
0 28-250 0 000090 OH HHH 4.4BSD] 0 0 
E 0 E [] socket[] bind 
E ( 3000) connect 
connect 0 | | L] LU u 
| RFC 1122 
0 Uu 0 0 Internet PCB TCP 
[] TCP[] | 
[| 28-31[] Ul [| connect 0 O SYN E E 
SYN SENT 
SYN O O 28-18 28-20 0 SYN ACK 
SYN RCVD 0 (Y 24-15) 28-32 
O O 28-20 TF ACKNOW[] tcp. output Ü 10 0 SYNU ACK([] 24- 
16 tcp outflags)[] SYN O 1530 | | 154 
SYN 
00 SYN: 153 154 155 ... HH =SYN_SENT 
snd una snd_nxt 
snd_max 
U 28-31 000.0 $80 00000000 0 
SYN 
DD SYN: 153 154 155 = DO =SYN_RCVD 
rev nxt 
0 28-32 [000000SYNDOOOOOODOOOO 
28-20 | 0 SYN SENT 
28-33 SYN[] ACK 
SYN 
O O SYN, ACK: 153 154 155 
rcv_nxt 


0 28-33 0000 SYND ^ck;nBDüDüDü Da OD UD 

















28 


TCP 





























769 
















































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































SYN_RCVD 29-2 
28-24 
SYN 
todrop = rcv nxt - rcv seq 
= 154 - 153 
SYN ti seq 154[] todrop 0 todrop 
(0) 28-25 " 
u TCP dropafterack O 
SYN_RCVD todrop 0 ACK 
( )[] Net/3 
SYN RCVD ESTABLISHED 
28-34 
connect ogg 
soconnect 
tcp_ output tcp input tcp output tcp input 
ip output ipintr ip output ipintr 
| ! 000 | | 000 
looutput looutput 
000 ipintrq 000 ipintra 
U D 00 SYN 00 SYN O I SYN, ACK O 0 SYN, ACK 
0000 CLOSED SYN SENT SYN RCVD SYN_RCVD 
0000 SYN SENT SYN RCVD SYN RCVD ESTABLISHED 
U 28-34 DUH ü B D] HD B D. I B U 
| E o connect PRU. CONNECT[] [] [] 
SYN 0 0 | IP | | ipintrq 





























































































































































































































ipintr 














ipintr 














tcp input 


























tcp input 























770 









































China-pubecom 























































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































TCP/IP 2 
tcp output ACK[] SYN ipintrq 
ipintr ipintr tcp input 
ESTABLISHED 
28.10 00000 
28-35 tcp input 
737 Tx : tcp_input.c 
738 * If last ACK falls within this segment’s sequence numbers, 
739 * record its timestamp. 
740 */ 
741 if (ts present && SEQ LEQ(ti-»ti, seq, tp->last ack sent) && 
742 SEQ LT(tp->last ack sent, ti->ti seg + ti-»ti len + 
743 ((tiflags & (TH SYN | TH FIN)) != 0))) € 
744 tp-»ts recent age = tcp now; 
745 tp->ts recent = ts val; 
746 } 
tep input.c 
0 28-35 top input [I 000000 
737-746 ts recent 26.6 
Net/3 FIND SYN 
((tiflags 8 (TH_SYN|TH_FIN)) != 0) 
0 1 
28.11 RSTOD 
28-36| RST switch 
1. SYN RCVD 
759-761 ECONNREFUSED 
SYN LISTEN SYN RCVD 
TCP ACK[] SYN RST so 
28-7 sonewconn dropsocket drop 
24-15 SYN RCVD LISTEN 
connect SYN RCVD 
RST 
tcp input.c 
747 /* 
748 * If the RST bit is set examine the state: 
749 * SYN RECEIVED state: ' 
750 * If passive open, return to LISTEN state. 
751 * If active open, inform user that connection was refused. 
752 = ESTABLISHED, FIN WAIT 1, FIN_WAIT2, CLOSE WAIT states: 
753 * Inform user that connection was reset, and close tcb. 
754 * CLOSING, LAST ACK, TIME WAIT states 
755 * Close the tcb. 
756 */ 


[] 28-36 tcp input 00000 RSTO U 

















Chi HILL 28 TCP 771 




















































































































































































































































































































































































































































































































































































































































































































































































































757 if (tiflags & TH RST) 
758 switch (tp->t state) ( 
759 case TCPS SYN RECEIVED: 
760 So-»so error = ECONNREFUSED; 
761 goto close; 
762 case TCPS ESTABLISHED: 
763 case TCPS FIN WAIT 1: 
764 case TCPS FIN WAIT 2: 
765 case TCPS CLOSE WAIT: 
766 s0->so error = ECONNRESET; 
767 close: 
768 tp->t state - TCPS, CLOSED; 
769 tcpstat.tcps dropst++; 
770 tp = tcp_close(tp); 
771 goto drop; 
772 case TCPS CLOSING: 
773 case TCPS_LAST_ACK: 
774 case TCPS TIME WAIT: 
775 tp = tcp_close (tp); 
776 goto drop; 
777 å 
} tcp_input.c 
H 28-36 ([]) 
2. 

762-777 ESTABLISHED[] FIN WAIT 1[] FIN WAIT 2[] CLOSE WAIT 
RST ECONNRESET CLOSING[] LAST ACK[] TIME WAIT 
RST TIME WAIT TIME WAIT 

RFC 1337 [Braden 1992] TIME WAIT 
RST TIME WAIT 28.10 
28-37 SYN ACK 
778 Tx tcp input.c 
779 £ If a SYN is in the window, then this is an - 
780 * error and we send an RST and drop the connection. 
781 */ 
782 if (tiflags & TH SYN) ( 
783 tp = tcp drop(tp, ECONNRESET); 
784 goto dropwithreset; 
785 ) 
786 PE 
787 * If the ACK bit is off we drop the segment and return. 
788 */ 
789 if ((tiflags £ TH_ACK) == 0) 
790 goto drop; 
tcp input.c 
[] 28-37 tcp input 0200000000 SYN[I DD H ACKD D DU 
778-785 SYN 














ECONNRESE 



































































































































































































































772 TCP/IP 2 China-pub.com 
a — — Hi 





































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































786-790 ACK | 
| U U ACK 
28.12 00 
TCP 
| TCP 0 
SYN 0 RST 
U U 
25.1 Net/3 262 444 28-7 
28.2 Net/3 0 262 444 LU LU 60ms[] 0 
0 ( 0 1 24-5 ) 
28.3 28-10 bcopy 
28.4 26.6 TCP RFC 1323 A 
TCP 
28.5 PRU_ATTACH PCB[] TCP 
tcp template SYN 28-17 
28.6 RFC 1323 28-22 24 
28.7 28-22 24 tcp now-ts recent age 
TCP_PAWS_IDLE|] |] | Net/3 | 500ms | 
28.8 RFC 1323 28-221] PAWS RST| 
28.9 SYN SYN/ACK ESTABLISHED 
ACK ACK SYN/ACK 
SYN/ACK| 
28.10 | U 
TIME_WAIT 2MSL ( 
) SYN 



































































































































































































































Dik dek 


U 29] ICPU DO (0) 


291 UI 


























































































































































































































































































































































































































































































































































































































































































































































































































Di O TCP| | OOO 28-37 E 
0 ACK[] 0 0 0 
ACK URG L 
FIN tcp output 
29.2 ACKDODO 
UH ACK] [] | 29-1 [] ACK | SYN RCVD 
U 0 (| 0 LISTEN[] SYN SENT 
ACK ) TCPS FIN WAIT lT TCPS CLOSING 
TCPS LAST ACK[] U U U U U U U U U U U ACOOOOOOOOOO 
TIME WAITO | ACK[] 2MSL Ul | 

















































































































switch (tp->t state) { 


case 


complete processing of passive open and process 


case 
case 
case 
case 
case 
case 
case 


TCPS SYN RECEIVED: 


simultaneous open or self-connect; 
/* fall into ... */ 


TCPS ESTABLISHED: 
TCPS FIN WAIT 1: 
TCPS FIN WAIT 2: 
TCPS CLOSE WAIT: 
TCPS CLOSING: 
TCPS LAST ACK: 
TCPS TIME WAIT: 


. process duplicate ACK; 


update RTT estimators; 


if all outstanding data ACKed, turn off retransmission timer; 


remove ACKed data from socket send buffer; 


switch (tp->t state) { 


case TCPS FIN WAIT 1: 


if (FIN is ACKed) ( 


move to FIN WAIT 2 state; 
start FIN WAIT 2 timer; 


} 
break; 


case TCPS_CLOSING: 


if (FIN is ACKed) { 


D 29-1 


ACK] O00 


774 


China-pub.con 





TCP/IP 2 









































move to TIME WAIT state; 
start TIME WAIT timer; 


H 
break; 


case TCPS LAST ACK: 


if (FIN is ACKed) 
move to CLOSED state; 
break; 


case TCPS TIME WAIT: 


restart TIME WAIT timer; 
goto dropafterack; 






















































































































































































































































































































































































































































































































































































































































































3 
U 29-1 (0) 
29.3 00000000000 
29-2 SYN_RCVD]|] [| ACK | 
( ) | ( ) | 

1. ACK 
801-806 ACK] SYN snd una (tcp sendseqinit 
snd una ISS[] SYN ) snd max 

ESTABLISHED 
tcp input.c 

791 Tr 

792 * Ack processing. 

793 : 

794 switch (tp-»t state) { 

795 1* 

796 * In SYN_RECEIVED state if the ack ACKs our SYN then enter 

797 * ESTABLISHED state and continue processing, otherwise 

798 * send an RST. 

799 */ 

800 case TCPS_SYN_RECEIVED: 

801 if (SEQ GT(tp->snd una, ti-»ti ack) || 

802 SEQ_GT(ti->ti_ack, tp->snd_max) ) 

803 goto dropwithreset; 

804 tcpstat.tcps_connects++; 

805 soisconnected (so); 

806 tp->t_state = TCPS_ESTABLISHED; 

807 /* Do window scaling? */ 

808 if ((tp->t flags & (TF RCVD SCALE | TF REQ SCALE)) == 

809 (TF RCVD SCALE | TF REQ SCALE)) I 

810 tp->snd scale = tp->requested s scale; 

811 tp-»rcv scale = tp->request r scale; 

812 ) 

813 (void) tcp reass(tp, (struct tcpiphdr *) 0, (struct mbuf +) 0); 

814 tp->snd wll = ti->ti seq - 1; 

815 /* £all into ... */ 





tcp input.c 


[] 29-2 tcp input J O00 SYN Rcv JO D] [] ACK 











China-bubıtom wa romana) 775 

















































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































soisconnected 
( ) accept 
select 
2. 
807-812 TCP TCP 
TCP snd_scalel] rcv scale 
O( ) 
3. 
813 tcp_reass 
SYN SYN_RCVD 
814 snd_wll 1 29-15 3 
294 IJI0000000000 
29-3 ACK ACK TCP 
[Jacobson 1990c] [Floyd 1994] 
. ( 3l] ) ACK TCP 
RFC 1122 4.2.2.21 
TCP ACK 27-15 
Net/3 4.3BSD Tahoe Net/1 
s ( ) 
4.3BSD Reno Net/2 
Net/3 
24-171] U ACK 
snd_una < OO <= snd max 
snd_una 29-5 
ACK 5 
1) snd_una 
2) 0 
3) 
4) ( ) 
5) TCP ( snd una) 
ACK( 10) 20 3 29-3 4[] 5 29-4 
) 
TCP ACK t_dupacks 
(tcprexmtthresh[] 3) 1[] 21.7 
2[] -15 TCP ACK 





























































































































































































































776 





China-pubecom 




















































































































































































































































































































































































































TCP/IP 2 
TCP 
1[] 21.7 
ETE 2 icp input.c 
817 * In ESTABLISHED state: drop duplicate ACKs; ACK out-of-range 
818 * ACKs. If the ack is in the range 
819 * tp-»snd una < ti-»ti ack <= tp->snd max 
820 * then advance tp->snd una to ti-»ti ack and drop 
821 * data from the retransmission queue. If this ACK reflects 
822 * more up-to-date window information we update our window information. 
823 */ 
824 case TCPS ESTABLISHED: 
825 Case TCPS FIN WAIT 1: 
826 case TCPS FIN WAIT 2: 
827 case TCPS CLOSE WAIT: 
828 case TCPS CLOSING: 
829 case TCPS LAST ACK: 
830 Case TCPS TIME WAIT: 
831 if (SEQ LEQ(ti-»ti ack, tp->snd una)) { 
832 if (ti-»ti len == 0 && tiwin == tp-»snd wnd) ( 
833 tcpstat.tcps_rcvdupack++; 
834 /* 
835 * If we have outstanding data (other than 
836 * a window probe), this is a completely 
837 * duplicate ack (ie, window info didn't 
838 * change), the ack is the biggest we've 
839 * seen and we've seen exactly our rexmt 
840 * threshold of them, assume a packet 
841 * has been dropped and retransmit it. 
842 * Kludge snd nxt & the congestion 
843 * window so we send only this one 
844 * packet. 
845 u 
846 * We know we're losing at the current 
847 * window size so do congestion avoidance 
848 * (set ssthresh to half the current window 
849 * and pull our congestion window back to 
850 * the new ssthresh). 
851 * 
852 * Dup acks mean that packets have left the 
853 * network (they're now cached at the receiver) 
854 * so bump cwnd by the amount in the receiver 
855 * to keep a constant cwnd packets in the 
856 * network. : 
857 */ 


————————————  nVn Be input.c 





O 29-3 tcp inut JO0O0000000 ACKD UD 


u ” 













































































ACK 






























































ACK ACK 










































































TCP 
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5 3 ACK tcps rcvdupack 
1 ACK (t dupacks) 0 
t dupacks 0 
29-4 5 
ACK 
1) t dupacks 3(tcprexmtthresh) 





















































































































































2) t dupacks 3 TCP 
3) t dupacks 3 



























































































































































































































































































































































































































































































































































































































































- - tcp. input.c 
858 if (tp->t timer[TCPT REXMT] == ll 
859 ti->ti_ack != tp->snd una) 
860 .tp->t dupacks = 0; 
861 else if (++tp->t_dupacks == tcprexmtthresh) ( 
862 tcp_seq onxt = tp->snd nxt; 
863 u_int win = 
864 min(tp->snd_wnd, tp->snd_cwnd) / 2 / 
865 tp->t_maxseg; 
866 if (win < 2) 
867 win = 2; 
868 tp->snd_ssthresh = win * tp->t maxseg; 
869 tp-»t timer[TCPT REXMT] = 0; 
870 tp-»t rtt - 0; 
871 tp->snd_nxt = ti-»ti ack; 
872 tp->snd_cwnd = tp->t_maxseg; 
873 (void) tcp output (tp); 
874 tp->snd cwnd = tp->snd_ssthresh + 
875 tp->t_maxseg * tp->t_dupacks; 
876 if (SEQ_GT(onxt, tp->snd_nxt)) 
877 tp->snd_nxt = onxt; 
878 goto drop; 
879 } else if (tp->t_dupacks > tcprexmtthresh) { 
880 tp->snd_cwnd += tp->t_maxseg; 
881 (void) tcp output (tp) ; 
882 goto drop; 
883 } 
884 } else 
885 tp->t_dupacks = 0; 
886 break; /* beyond ACK processing (to step 6) */ 
887 } š 
tcp input.c 
U 29-4 tcp input [000000 ACK 
1. [] ACK 3 
861-868 t dupacks 3(tcprexmtthresh) onxt snd_nxt 
(ssthresh) 
25-27 
2. 













































































869-870 TCP Lt rtt 






































































































































778 
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TCP/IP 2 
3. 
871-873 ACK ( ACK 
) snd_nxt tcp_output 
( 1 21-7 63 ) 
4. 
874-875 d Ñ 
ACK ( 
) 1 21-10 21-11 
5 snd_nxt 
876-878 (snd_nxt) (onxt) 
snd_nxt tcp_output snd_nxt 
snd_nxt tcp_output 
6. ACK 3 
879-883 t_dupacks 3 ACK 
1 tcp_output 
ACK( 1 21-7[] 67 69 71 
884-885 ACK 
5 ACK 
7. ACK 
886 break 3 (1) 5 (2) 
3 (3) ACK 3 
ACK break 29-21) switch step6 
8 
1-8 1 2 
3] 4 (1) 5-8 TCP 
9 8 9 
ACK 1 ACK TCP 
1 
1 21-10 ACK 
ACK 
29.5 ACKOD 
29-5 ACK 
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tcp input.c 
888 ZS 
889 * If the congestion window was inflated to account 
890 * for the other side’s cached packets, retract it. 
891 */ 
892 if (tp->t dupacks > tcprexmtthresh && 
893 tp->snd cwnd > tp->snd ssthresh) 
894 tp->snd cwnd = tp->snd ssthresh; 
895 tp->t dupacks = 0; 
896 if (SEQ_GT(ti->ti_ack, tp-»snd max)) { 
897 tcpstat.tcps_rcvacktoomuch++; 
898 goto dropafterack; 
899 } 
900 acked = ti->ti_ack - tp->snd_una; 
901 tepstat .tcps_revackpack++; 
902 tcpstat.tcps_rcvackbyte += acked; . 
tcp input.c 
[| 29-5 tcp input JO O O J ACKO [| 
1. 
888-895 ACK 3 4 4 
ACK ACK 4 
ACK ACK 1 
ACK 
2. ACK 
896-899 ACK| 
snd una < JO) [ <= snd. max 
snd max TCP 
ACK 24-5 
( ) 
3. 
900—902 ACK[] acked 
29-6 ACK RTT 
4. RTT 
903-915 (1) (2)TCP 
tcp_xmit_timer RTT 
tcp_xmit_timer (tcp. now) (ts. ecr) 
1( 1) 
ACK TCP 
1~1024 1025~2048 
2049 2049 1( )[] TCP RTT 
5. 
916-924 (ti_ack) TCP (snd_max) 
needoutput 























































































































































































































780 
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tcp output TCP 
ACK ( 
29-8 snd una ) 
tcp_input.c 
903 /* cpmp 
904 * If we have a timestamp reply, update smoothed 
905 * round-trip time. If no timestamp is present but 
906 * transmit timer is running and timed sequence 
907 * number was acked, update smoothed round-trip time. 
908 * Since we now have an rtt measurement, cancel the 
909 * timer backoff (cf., Phil Karn's retransmit alg.). 
910 * Recompute the initial retransmit timer. 
911 */ ` 
912 if (ts present) 
913 tcp.xmit timer(tp, tcp now - ts ecr + 1); 
914 else if (tp-»t rtt && SEQ GT(ti-»ti eck, tp-»t rtseq)) 
915 tcp xmit, timer(tp, tp-»t rtt); 
916 /* 
917 * If all outstanding data is acked, stop retransmit 
918 * timer and remember to restart (more output or persist). 
919 * If there is more data to be acked, restart retransmit 
920 * timer, using current (possibly backed-off) value. 
921 */ 
922 if (ti->ti_ack == tp->snd max) { 
923 tp->t timer [TCPT_REXMT] = 0; 
924 needoutput = 1; 
925 } else if (tp->t_timer[TCPT_PERSIST] == 0) 
926 tp->t_timer[TCPT_REXMT] = tp-»t rxtcur; A 
tcp_input.c 
0 29-6 tcp input I DO RTTIOOOOOOOO 
6. 
925-926 
t_rxteur 
Karn 
Karn (O 10 21.3[] ) 
RTT ( 
) 25-26 Karn t rtt 0 
29-6 RTT 
t rtt 0 t rtt 
RTT RFC 1323 ts ecr 
Karn 
29-7 ACK 
927 = tcp input.c 
928 * When new data is acked, open the congestion window. 
929 * If the window gives us less than ssthresh packets 


U 29-7 tcp input JO0000000Ack 00 0 U D D 
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930 * in flight, open exponentially (maxseg per packet). 
931 * Otherwise open linearly: maxseg per window 
932 * (maxseg^2 / cwnd per packet), plus a constant 
933 * fraction of a packet (maxseg/8) to help larger windows 
934 * open quickly enough. 
935 */ 
936 { 
937 u_int cw = tp->snd_cwnd; 
938 u_int incr = tp->t_maxseg; 
939 if (cw > tp->snd_ssthresh) 
940 iner = incr * incr / cw + incr / 8; 
941 tp->snd_cwnd = min(cw + incr, TCP_MAXWIN << tp->snd scale); 
942 } å 
tcp input.c 
129-7 (0) 
1. 
927-942 ACK 
ACK( ) 1 1 
incr * incr / cw 
t_maxseg * t_maxseg / snd_cwnd 
1 snd_cwnd 
1/8 1 
21.8 
( 1/8) [Floyd 1994] 
BSD 4.3BSD[] 4.4BSD[] Net/3 
29-8 tcp input 
- tcp input.c 
943 if (acked > so-»so snd.sb cc) ( 
944 tp->snd wnd -= so->so snd.sb cc; 
945 sbdrop (&so->so_snd, (int) so-»so snd.sb cc); 
946 ourfinisacked = 1; i 
947 } else { 
948 sbdrop (&so->so_snd, acked); 
949 tp->snd_wnd -= acked; 
950 ourfinisacked = 0; 
951 ) . 
952 if (so-»so snd.sb flags & SB NOTIFY) 
953 sowwakeup (so); 
954 tp->snd una = ti-»ti ack; 
955 if (SEQ LT(tp->snd nxt, tp->snd una)) 
956 tp->snd nxt = tp-»snd una; . 
tcp input.c 


029-8 tcp input U UU 00 0000 0 0 0 0 0 0 0 0 





2: 
943-946 snd_wnd 



























































































































































































































































782 seman 02 China+pub.tom 
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FIN sbdrop 
FIN FIN 
947-951 |] ourfinisacked 0 
E acked 0 
3. 
951-956 sowwakeup snd_una 
snd_una snd_nxt 
29-9 | snd_nxt Uu snd una 0 
1-512 513-1024 
1 2 äs 512 513 514 PE 1024 1025 
— — —'nn A  -— —ə — OMI OU .-— —— _ 
4 (0000 (0000 å 
snd una snd nxt 
snd max 
[299 79008000080 
25-26 snd_nxt snd_una 
tcp_output 1-512 tcp output[] snd_nxt 
513 29-10 
1 2 SN 512 513 514 — 1024 1025 
— 
A (0000 A A 
snd_una snd_nxt snd_max 
029-10 900000002000 (ID 29-9) 
1025[] ACK ( ACK 
) ACK snd_max snd_una 
ACK 29-11 switch 4 
tcp_input.c 
957 switch (tp->t_state) { SE 
958 /* 
959 * In FIN WAIT 1 state in addition to the processing 
960 * for the ESTABLISHED state if our FIN is now acknowledged * 
961 * then enter FIN WAIT 2. 
962 Si 
963 case TCPS FIN WAIT 1: 
964 if (ourfinisacked) { 
965 /* 
966 * If we can't receive any more 
967 * data, then closing user can proceed. 
968 * Starting the timer is contrary to the 


[29-11 tcp input 00 0 0 FIN WAIT 10 00000 ACK 
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969 * specification, but if we don't get a FIN 
970 * we'll hang forever. 
971 */ 
972 if (so-»so state & SS CANTRCVMORE) I 
973 soisdisconnected (so); 
974 tp->t_timer[TCPT_2MSL] = tcp_maxidle; 
975 } 
976 tp->t_state = TCPS_FIN_WAIT_2; 
977 } 
978 break; . 
tcp input.c 
H 29-11 ([]) 
4. [] FIN WAIT 1 ACK 
958-971 TCP FIN FIN 
FIN FIN. WAIT 2 
29-8 ourfinisacked 
5. FIN WAIT 2 
972-975 25.6 Net/3 FIN. WAIT 2 FIN. WAIT 2 
([] close 
close ) ( FIN 
) 
29-12 CLOSING ACK 
tcp_input.c 
979 /* ver 
980 * In CLOSING state in addition to the processing for 
981 * the ESTABLISHED state if the ACK acknowledges our FIN 
982 * then enter the TIME-WAIT state, otherwise ignore 
983 * the segment. 
984 */ 
985 case TCPS CLOSING: 
986 if (ourfinisacked) ( 
987 tp->t state = TCPS TIME WAIT; 
988 tep_canceltimers (tp); 
989 tp-»t timer[TCPT 2MSL] = 2 * TCPTV_MSL; 
990 Soisdisconnected(so); 
991 } 
992 break; I 
tcp_input.c 
0 29-12 tcp input 0000 CLOSING] [| 9 0 ACK 
6. || CLOSING ACK 
979-992 ACK FIN ( ) 
TIME_WAIT ( Jl] TIME WAIT 
MSL 





































































































29-13 LAST ACK ACK] [| 



























































784 
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TCP/IP 2 

gus m tcp input.c 
994 * In LAST ACK, we may still be waiting for data to drain 

995 * and/or to be acked, as well as for the ack of our FIN. 

996 * If our FIN is now acknowledged, delete the TCB, 

997 * enter the closed state, and return. 

998 *7 

999 case TCPS LAST ACK: 
1000 if (ourfinisacked) { 
1001 tp = tcp close(tp); 
1002 goto drop; 
1003 } 
1004 break; 

tcp_input.c 
0 29-13 tcp input J [| [ [| LAST ACK[ [] [] [] ACK 
7. 0 LAST ACK ACK 
993-1004 FIN CLOSED tcp close 
Internet PCB[] TCP 
29-14 TIME WAIT ACK| 

1005 "m tcp input.c 
1006 * In TIME WAIT state the only thing that should arrive 

1007 * is a retransmission of the remote FIN.  Acknowledge 

1008 * it and restart the finack timer. 

1009 */ 

1010 case TCPS_TIME_WAIT: 

1011 tp->t_timer [TCPT_2MSL] = 2 * TCPTV_MSL; 

1012 goto dropafterack; 

1013 } 

1014 } A 

tcp input.c 





8. [| TIME WAIT 





1005-1014 


29-14 tcp input 0000 TIME WAITQ D DD ACK 














ACK 























FIN 























FIN 
































TCPII [| 


























FIN 


















































FIN( 








ACK) 





TCP 






























































TIME WAIT 

























































































MSL 

















296 000 


U U U 





TCP 

















snd wll 








snd wl2 









































end wll 







































































(snd wnd) 








e end wl2 














































































































ACK 































































































































































































snd wll 








ti_seq| 1 
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(snd 











wnd) 


























1) 















































snd_wll 


























(tiwin) 
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snd_wll<ti_seq 
2) (snd, w11 ti seq) snd wl2 


snd wl2«ti ack 






























































































































































































































































































































































































































































































































































































































































































































































































































































3) 
snd una 

29-15 
1015 steps: Ek a 
1016 /* 
1017 * Update window information. 
1018 * Don't look at window if no ACK: TAC's send garbage on first SYN. 
1019 */ 
1020 if ((tiflags € TH_ACK) && 
1021 (SEQ LT(tp->snd wll, ti->ti seq) || tp->snd_wll == ti->ti seq && 
1022 (SEQ LT(tp->snd wl2, ti->ti ack) || 
1023 tp->snd wl2 == ti->ti ack && tiwin > tp->snd wnd))) ( 
1024 /* keep track of pure window updates */ 
1025 if (ti->ti len == 0 && 
1026 tp->snd wl2 == ti->ti ack && tiwin > tp->snd wnd) 
1027 tcpstat.tcps_rcvwinupd++; 
1028 tp->snd_wnd = tiwin; 
1029 tp->snd wll = ti->ti_seg; 
1030 tp->snd wi2 = ti->ti_ack; 
1031 if (tp->snd_wnd > tp->max_sndwnd) 
1032 tp->max_sndwnd = tp->snd_wnd; 
1033 needoutput = 1; 
1034 } 


= ep input.c 































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































O 29-15 tcp input 0 D D D 00 0 0 U 
1. 
1015-1023 if ACK 3 
LISTEN SYN_SENT SYN step6 
LISTEN SYN ACK 
TAC “ (terminal access controller)” ARPANET 
Telnet 
1024-1027 ( OTT ACK 
) tcps_rcvwinupd 
2. 
1028-1033 snd wll[| and w12 
TCP max sndwnd 
26-8 snd wnd 
needoutput 





















































































































































786 


29.7 D00000 
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TCP/IP 2 






























































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































TCP| URG 29-16 
tcp. input.c 
1035 /* PEE 
1036 * Process segments with URG. 
1037 */ 
1038 if ((tiflags & TH_URG) && ti->ti_urp && 
1039 TCPS_HAVERCVDFIN (tp->t_state) == ot 
1040 /* 
1041 * This is a kludge, but if we receive and accept 
1042 * random urgent pointers, we'll crash in 
1043 * soreceive. It’s hard to imagine someone 
1044 * actually wanting to send this much urgent data. 
1045 */ 
1046 if (ti->ti urp + so-»so rcv.sb cc > sb max) í 
1047 ti->ti urp = 0; /* XXX */ 
1048 tiflags &= "TH URG; /* XXX */ 
1049 goto dodata; /* XXX */ 
1050 } S 
tcp input.c 
U 29-16 tcp input 0.0 0 U D D 0 0 0 0 
1. URG 
1035-1039 URG 
(ti_urp) FIN TIME_WAIT 
TCPS_HAVERCVDFIN URG 
CLOSE WAIT[] CLOSING[] LAST ACK[] TIME WAIT 
URG 
2. 
1040-1050 
URG 
29-17[] tcp input 
tcp input.c 
1051 zi cp_mp 
1052 * If this segment advances the known urgent pointer, 
1053 * then mark the data stream. This should not happen 
1054 '* in CLOSE WAIT, CLOSING, LAST ACK or TIME WAIT states since 
1055 * a FIN has been received from the remote side. 
1056 * In these states we ignore the URG. 
1057 * 
1058 * According to RFC961 (Assigned Protocols), 
1059 * the urgent pointer points to the last octet 
1060 * of urgent data. We continue, however, 
1061 * to consider it to indicate the first octet 
1062 * of data past the urgent section as the original 
1063 * spec states (in one of two places). 
1064 */ 
1065 if (SEQ GT(ti->ti seq + ti->ti_urp, tp->rcv_up)) { 


0 29-17 tcp input J00000000000 
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1066 tp->rcv_up = ti->ti_seq + ti->ti_urp; 
1067 so->so_oobmark = so->so_rcv.sb_cc + 
1068 (tp->rcv_up - tp->rcv_nxt) - 1; 
1069 if (so->so_oobmark == 0) 
1070 so->so_state |= SS_RCVATMARK; 
1071 sohasoutofband (so); 
1072 tp->t_oobflags &= ” (TCPOOB_HAVEDATA | TCPOOB HADDATA) ; 
1073 } 
1074 /* i 
1075 * Remove out-of-band data so doesn't get presented to user. 
1076 * This can happen independent of advancing the URG pointer, 
1077 * but if two URG's are pending at once, some out-of-band 
1078 * data may creep in... ick. 
1079 *y 
1080 if (ti-»ti urp <= ti-»ti len 
1081 #ifdef SO OOBINLINE 
1082 KK (so->so options & SO OOBINLINE) == 0 
1083 #endif 
1084 ) 
1085 tcp pulloutofband(so, ti, m); 
1086 ) else ( 
1087 FE 
1088 * If no out-of-band data is expected, pull receive 
1089 * urgent pointer along with the receive window. 
1090 */ 
1091 if (SEQ GT(tp-»rcv nxt, tp->rcv up)) 
1092 tp-»rcv up = tp->rcv_nxt; 
1093 ) . 
tcp input.c 
[] 29-17 ([]) 
1051-1065 
26-30 3 29- 
18 
(rcv up) 00000 
rcv_nxt if ti_len=3 
(4 3 All rev up 7 4 5 6 
3. 
1066-1070 
rcv_nxt 
rcv, up 
ti se 
(so rcv.sb cc) aii: 
i G 2 ti_urp=3 
mar 
en ee 0000000 
6 
Ü U 29-18 26-30 80000000000 
send 1 
Berkeley 
4. TCP 




























































































































































































1071-1072 sohasoutofband 




























































































788 TCP/IP 2 China=pupecom 
— — ——mm 
















































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































TCPOOB_HAVEDATA|| TCPOOB HADDATA 30-8 PRU RCVOOB 
5. 
1074-1085 
TCP 
SO OOBINLINE ( Net/3 ) 
t iobc 
tcp pulloutofband 
TCP[] [| | 
TCP 
6. 
1086-1093 rcv nxt rcv up 
rcv nxt URG 
29-17 SEQ GT 
26.6 29-160 0 29-17 
29.8 tcp pulloutofband[||[]| 
29-17 
1) 
2) ( ) 
3) SO OOBINLINE 
( mbuf[] ) TCP 
t iobc recv MSG OOB 
30-8 PRU RCVOOB 29-19 
tcp. input.c 
1282 void en 
1283 tcp pulloutofband(so, ti, m) 
1284 struct socket *so; 
1285 struct tcpiphdr “ti; 
1286 struct mbuf *m; 
1287 { 
1288 int ent = ti->ti_urp - 1; 
1289 while (cent >= 0) { 
1290 if (m->m len > cnt) { 
1291 char *cp = mtod(m, caddr t) + cnt; 
1292 struct tcpcb *tp = sototcpcb(so); 
1293 tp->t_iobc = *cp; 
1294 tp->t_oobflags |= TCPOOB_HAVEDATA; 
1295 bcopy (cp + 1, cp, (unsigned) (m->m_len - cnt - 1)); 
1296 m->m_len--; 
1297 return; 
1298 } 
1299 cnt -- m-»m len; 


[] 29-19 tcp pulloutofpamd 00000000000 tiae OOD 
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1300 m = m->m_next; 
1301 if (m == 0) 
1302 break; 
1303 } 
1304 panic ("tcp_pulloutofband") ; 
1305 } I 
tep input.c 
0 29-19 ([]) 
1282-1289 29-20 3 7 
6 5 mbu 
ent 2 m len( 5) 2 if 
1290-1298 cp 6 t_iobc 
TCPOOB_HAVEDATA bcopy ( 718 1 29- 
21 
00000 t. iobc 
m len-ti len-5 ti len=5 
m_len=4 
4 4 4 4 5 7 8 
rcv nxt : 0000 rcp_up 
ti_seq 4 
i t i_urp = 3 i rcv nxt 
0000020090 ti seg 
0 2920 9000000000 02921 1000000000 (ü O 29-20) 
718 mbu 105004 ti_len 
5 TCP_REASS tcp_reass 
( ) rcv nxt ti len ti len 5 
9 mbuf 
(m pkthdr.len)[]1 sbappend 
mbuf 
1299-1302 mbu cnt mbu 
mbu 
mbuf break panic 
29.9 00000000 
tcp input ( ) 






























































































































































































































































29-22 
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TCP/IP 2 
tcp input.c 
1094 dodata /* XXX */ PL 
1095 /* 
1096 * Process the segment text, merging it into the TCP sequencing queue, 
1097 * and arranging for acknowledgment of receipt if necessary. 
1098 * This process logically involves adjusting tp->rcv_wnd as data 
1099 * is presented to the user (this happens in tcp usrreq.c, 
1100 * case PRU RCVD). If a FIN has already been received on this 
1101 * connection then we just ignore the text. 
1102 * 
1103 if ((ti->ti len || (tiflags & TH_FIN)) && 
1104 TCPS_HAVERCVDFIN(tp->t_state) == 0) ( 
1105 TCP REASS (tp, ti, m, so, tiflags); 
1106 /* 
1107 * Note the amount of data that peer has sent into 
1108 * our window, in order to estimate the sender's 
1109 * buffer size. 
1110 Wi 
1111 len = so->so_rcv.sb_hiwat - (tp->rcv adv - tp->rcv_nxt); 
1112 } else { 
1113 m, freemim); 
1114 tiflags &= “TH FIN; 
1115 } i 
tcp input.c 
U 29-22 tcp input DO DO D ü D D D 0 0 0 0 D D 0 
1094-1105 
1) 0 FIN 
2) FIN 
TCP REASS ( ) 
ACK rcv nxt 
tcp_reass ( 
) 
(tiflags) 
tcp reass[|tiflags 0 FIN ( ) 
FIN LE 
1-1024 
1025-2048 FIN 
( 1025-2048) ACK FIN 
29-22 0 FIN 
TCP_REASS tcp_reass ti seq(2049[] FIN ) rcv nxt 
(DU tcp. reass 0(U 20) -23) TCP REASS tiflags 0 
FIN ( 29-10) FIN 
1106-1111 len 
8192(Net/3 ) TCP[] SYN 8192 
1-1024 29-23 TCP. REASS rcv nxt 
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rcv. nxt rcv. adv 
- 1025 - 8193 
[]29-23 DOO 8192000000000 1-04] 000 
len 1024 len 
29-15 max_sndwnd 
o len | Net/1]] [] len[] 
TCP max rcvd 





















































if (len » tp-»max rcvd) 


tp-»max rcvd = len; 




























































































































































































































































































































































































































































































































































































Net/1 max rcvd 
1112-1115 len 0 FIN FIN 
| mbuf[] [] FIN 
29.10 FEINT 
tcp input g 29-24 FIN 
tcp input.c 

1116 /* š pap 

1117 * If FIN is received ACK the FIN and let the user know 

1118 * that the connection is closing. 

1119 */ 

1120 if (tiflags & TH_FIN) { 

1121 if (TCPS HAVERCVDFIN(tp->t state) == 0) I 

1122 socantrcvmore (so); 

1123 tp->t flags |= TF_ACKNOW; 

1124 tp->rcv_nxt++; 

1125 } 

1126 switch (tp->t_state) { 

1127 /* 

1128 * In SYN_RECEIVED and ESTABLISHED states 

1129 * enter the CLOSE_WAIT state. 

1130 */ 

1131 case TCPS_SYN_RECEIVED: 

1132 case TCPS_ESTABLISHED: 

1133 tp->t_state = TCPS CLOSE WAIT; 

1134 break; i 

tcp input.c 
D 29-24 top input DO D Pap DH 000 
1. FIN 

1116-1125 FIN FIN 
socantrcvmore TF_ACKNOW ACK( 1 

























































































































































































792 ws n: China-pubıcom 
TET u] 


























































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































rcv_nxt[] 1 FIN 
1126 FIN switch 
CLOSED[] LISTEN[] SYN SENT FIN 3 
| SYN FIN 
CLOSING[] CLOSE WAIT[] LAST ACK FIN 3 
FIN 
2. SYN RCVD[] ESTABLISHED 
1127-1134 | SYN RCVD[] ESTABLISHED FIN 
CLOSE WAIT 
SYN RCVD FIN 24-15 
LISTEN SYN 
FIN SYN SYN RCVD 
ACK FIN( FIN ACK 
29-2 ESTABLISHED ) 
29-25 FIN 
"ET Fr tep input.c 
1136 * If still in FIN WAIT 1 state FIN has not been acked so 
1137 * enter the CLOSING state. 
1138 */ 
1139 case TCPS FIN WAIT 1: 
1140 tp->t state = TCPS CLOSING; 
1141 break; 
1142 /* 
1143 * In FIN WAIT 2 state enter the TIME WAIT state, 
1144 * starting the time-wait timer, turning off the other 
1145 * standard timers. 
1146 * 
1147 case TCPS FIN WAIT 2: 
1148 tp->t state = TCPS TIME WAIT; 
1149 tcp canceltimers(tp); 
1150 tp->t_timer[TCPT_2MSL] = 2 * TCPTV_MSL; 
1151 soisdisconnected (so); 
1152 break; 
1153 /* 
1154 * In TIME WAIT state restart the 2 MSL time wait timer. 
1155 */ 
1156 case TCPS TIME WAIT: 
1157 tp->t_timer[TCPT_2MSL] = 2 * TCPTV MSL; 
1158 break; 
1159 H 
1160 H : š 
tcp_input.c 
U 29-25 tcp input WOO FINIOOOOOO 
3. FIN WAIT 1 
1135-1141 ACK FIN FIN WAIT 1 







































































































































































— FIN CLOSING 
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4. FIN_WAIT_2 
1142-1148 FIN TIME_WAIT FIN_WAIT_1 ACK 
FIN ( ) 24-15 0 FIN WAIT 1 | TIME WAIT 
[] 29-11 ACK FIN WAIT 2 | FIN 
TIME WAIT ACK[] FIN FIN WAIT 2 


































































































































































































5. TIME WAIT 































































































































































































































































































































































































































































































































































































































































































































































































1149-1152 [|] TCP TIME_WAITO I n MSL Ü 
| O ACK[] FIN 29-11 O FIN. WAIT 2l] [] [] ) 
6. TIME WAIT| 
1153-1159 TIME WAIT FIN 29-14 
TIME WAIT MSL 
29.11 90000 
29-26 tcp input 
dropafterack 
- I tcp input.c 
1161 if (so->so options & SO_DEBUG) 
1162 tcp trace(TA INPUT, ostate, tp, &tcp saveti, 0); 
1163 Ved 
1164 * Return any desired output. 
1165 */ 
1166 if (needoutput || (tp->t flags & TF ACKNOW)) 
1167 (void) tcp_output (tp); 
1168 return; 


1169 dropafterack: 




















































































































































































































































































































1170 få 
1171 * Generate an ACK dropping incoming segment if it occupies 
1172 * sequence space, where the ACK reflects our state. 
1173 * ` 
1174 if (tiflags & TH_RST) 
1175 goto drop; 
1176 m_freem(m); 
1177 tp->t flags |= TF_ACKNOW; 
1178 (void) tcp output (tp); 
1179 return; . 
tcp input.c 
U 29-26 tcp input 0090000900 
1. SO DEBUG 
1161-1162 SO DEBUG tcp trace 
28-7 IP[] TCP 
2. tcp. output 
1163-1168 needoutput (O 29-6 29-15) ACK 



























































































































































tcp output 








79 4 TCP/IP 


China-pubecom 
































































































































































































































































































































































































































































































































































































































































































































































































































































































































IH 020 
3. dropafterack 
1169-1179 | RST| H DD ACK([] [] RST OU DU 
| | mbuf|[|] tcp output [] ACK[] 
[] 29-27 tcp input 
- tcp input.c 
1180 dropwithreset: 
1181 PE 
1182 * Generate an RST, dropping incoming segment. 
1183 * Make ACK acceptable to originator of segment. 
1184 * Don't bother to respond if destination was broadcast/multicast. 
1185 “7 
1186 if ((tiflags & TH RST) || m->m_flags & (M_BCAST | M_MCAST) || 
1187 IN MULTICAST(ti->ti dst.s addr)) 
1188 goto drop; 
1189 if (tiflags & TH ACK) 
1190 tcp respond(tp, ti, m, (tcp seq) 0, ti-»ti ack, TH RST); 
1191 else { 
1192 if (tiflags & TH SYN) 
1193 ti->ti_len++; 
1194 tcp respond(tp, ti, m, ti->ti seq + ti->ti_len, (tcp sea) 0, 
1195 TH_RST | TH_ACK); 
1196 } 
1197 /* destroy temporarily created socket */ 
1198 if (dropsocket) 
1199 (void) soabort (so); 
1200 return; 
1201 drop: 
1202 JE 
1203 * Drop space held by incoming segment and return. 
1204 */ 
1205 if (tp && (tp->t inpcb-»inp socket->so options & SO DEBUG)) 
1206 tcp trace (TA DROP, ostate, tp, &tcp saveti, 0); 
1207 m freem(m); 
1208 /* destroy temporarily created socket */ 
1209 if (dropsocket) 
1210 (void) soabort (so); 
1211 return; 
1212 ) i 
tcp input.c 
0 29-27 tep input: 0 0 D U U D 0 0 
4. dropwithreset 
1180-1188 üt RST, IOLDI 00060 
RSTO 0000000 0RSTO O DD ORSTO O O ORSTO DOS 0000000000 U RST 
D 28-160 D 00000000 OG U 
IN MULTICAST II 
5. RSTEJ 000090 
1189-1196 RST | | || 10 ACKT D U | U U 
[] ACK 

















[] 29-28] RST 


































































































Chinaspubecom I 
























































0 00 RSTO 0 ( 
000000 DUU o OOOO uu 
HU ACK 00000000 0 TH RST 
DO ACK 0 0200000000 TH RST|TH ACK 














0 29-28 DORSTO 0000000 


























































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































SYN([] 24-16) ACK[] tcp. respond 
6. 
1192-1193 SYN ti len 1 RST SYN 
1 SYN 
28-6 Internet PCB dropwithreset 
RST SYN([] 28-18) 10 18.14 
RST 
tcp_respond mbu RST 
mbu mbu 
7. 
1197-1199 28-7 28-16 
U HOOD drop socket 
8. ( ACK[] RST) 
1201-1206 ACK[] RST tcp trace 
SO DEBUG ACK tcp_output 
SO_DEBUG RST RST 
1207-1211 mbu dropsocket 
29.12 0000 
TCP UDP (23.12] ) 0 
[Dalton et al. 1993] 
TCP PCB 10000 [McKenney and Dove 1992] 
[Partridge 1993] Van Jacobson 
TCP IP (RISC 25 ) 
(demultiplexer) PCB([] 10 ) TCP (O 30 ) 30 
LU LU TCP ( [ 
) TCP TCP 
2913 DOOD 








TCP TCP TCP 

















































































































































































































79 6 TCP/IP 2 
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RFC 1144[Jacobson 1994a] 
Van Jacobson VJ 
(RFC 1144 tcp output 
) (28.4[] ) 
29.13.1 0 
SLIP[] PPP 
TCP — IP ICMP 
IGMP|[] UDP ) IP/TCP| 40 3 
Telnet[] TCP 41 4 
256 16 16 
TCP 8 bit ID( 
256) / 96 bit 
— IP TCP IP TCP — 
29-29 
TCP 
29-29 
ID 1 IP 128.1.2.3 TCP 
1500 IP 192.3.4.5 TCP 25 ID 
2 
. DDD0000 O000000 
no D 000 IP/TOPO O OO nu U D 0 IP/TCP[] D 
0 
1 
E3 











O000000 
DB DD I d p (Br TCPD D 














Doc 









00000 


000 IP/TCPO O 
x |(92345.25. 1281.25, 1500) | 


pr gu o 


D 29-29 00 (SEP) D0O000000000 


D U 





















AUTO) 
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29 TCP (U) 
29-29 
( ) 
IP[] TCP — TCP 
29-30 | IP 
0000 IP 
000 










D TCPI D 0 0 D 
000 TCPD D 





00000000 
O O 96-bit0 O O 
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l TTT UNCOMPRESSED_TCP[] 
IP/ TCPO 
0 2930 IOO0O0000000000 
3 
1) IP 4 4 IP IP (O 8-8) 
2) COMPRESSED_TCP 1 IP 80 15 
( Tbit ) 
3) UNCOMPRESSED TCP 4 
IP ( 6 TCP) ID 
5-13 5- 
16 sl_compress_tcp TCP 
29-31 4p " -" IP 7 
cp 10 PO SO AO w[] E" | 




































































































































































































































































798 TCP/IP 2 China-bubıtoM 
—— 





U D DD D 0 1 0 O - - - - Ip 
0000 0 1 1 1 - - = - UNCOMPRESSED TCP 
1 C ISP S A W U COMPRESSED TCP 
129-3131 [000000000 
29-32 IP 





















































































































































r3 

O 
£ 
= 
EN 
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IPD D D 









O TCPO n 0-655150 00 PO D 


ds ja- 20-600 I O IPO O - 


TCPO D 0100 000 TCP 20-600 0 0 TCPO O 0-654950 0 0 TCPO 0 
a 20-600 O O IPO O > 


UNCOMPRESSED TOP; 0111) 00000 Im 20-600 D 0 TCPO D 0-654950 D [] TCPO O 
COMPRESSED_TCP: CNN 0-654950 D D TCPO D 


3-160 0 . 
D DA ree N 








































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































p 2932 )OO0O0000000000P000 
IP | TCP (U UDP[] ICMP[] IGMP 
) 000 TCP 0 [ IP | TCP | 
UNCOMPRESSED_TCP | TCP | 4 
IP 
IP TCP TCP 

. IP 

e SYN] FIND RST IB O 

* ACK 

3 IP 

TCP 

UNCOMPRESSED_TCP 
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a*pubecom 0290 TDD 010 799 


0000 655350000000000 





29132 0008010 


OOO00000002933000P0T7EOOO00000000000000000 
OOO00000000000 


0 15 16 31 


4-bit 4-bit | 8-bit — 
Ooo (0000 0000 os) = 
8-bit[] 0 O O (TTL) 16-bit] 0000 200 0 


32-bit[] IPO Å 


32-bit[] I IPO [J 


16-bit] D D D 16-bit[] O0 0 00 


32-bit[] [] 


32-bit OOO 200 D 


: UJAIPEPIS 
4-bit[] [] n D 6 bit) RICESES|Y 16-bit] OOO 
00 GIKÄHETIN 


16-bit TCPO DD | 16-bitI 0 0 D 





0 29-33 000 POTCEQOOOOOODOOOOOO 


OO0OOO0O000000000000000000000000000000000 
OOO00000000000000 POTEOOODODOOOOOOOOOOOOOOO 
OOO000000000000000000 002970 

OOO0000000000000000000000000 50%0 00000 vi 
OOO000000002934Q000001P/TeJI000 

U U 0 0 0 D U IP'TCGPD O00 3000000000 (0 0 0 0 70 D 16 bit] TCP] [| 
U U D 00 000 DU 000 000 DU 0 TCPpD 0 (SLIP 0 0 0 0 0 0 00 000 U 
PPPO DUDU 00 


800 
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poo 111 C [e[s [afefe] O00000000000000 
0,1! connid (C) i 00 cn :0 01D 
2 TCPO H Hn H 16- bit TCPO HB nn D 
0,1,3! urgoff (U) | KA aaa 
PE ze s= =] 
0,1,31 Awin (W) ! ID WO ıreeononnon 
l — t pet Meg i iama. — — — == 
0,1,31 Aack (A) | 0 AD LTCPDD 000 7 
G Stee a 
0, 1,3) Aseq (S) | DO SI rTCPD O00 
ba dere M 
0,1,3 Aipid (D ı 0010 1P00000 
uu 
0 29-34 0000 wrergogog 
6 connid|] urgoff[] Awin[] Aack[] Aseq[] Aipid] [] [| 29-34 
19 
4 bit[] SAW 16 
1 COMPRESSED TCP 
bit 6 29-35 7 bit 
DU D D D U [] OOOO U D 0 D 00 0 0000100 
C O O ID O0 DO 0 connid=[] [] ID 
I IP[] [] Ü ip_id ip idg [| 1 Aipid=IP[] 0000 
P TCPO OO PSH[ ODO PSHED OOO 
S TCPO 0 th seq th sega J Aseq=TCP|[] O00 
A TCP] 0 0 O th_ack th ack[] [] Aack=TCP] 000090 
W TCPO 0 th win th wing U Awin=TCO 00000 
U TCP[] D D D D 0 0 th urg URGO 0000 urgoff-[] 000000 
029-35 DOOO00 70000 
C C 0 ( ) 
ID 1 connid ID 0-255 
I I 0 IP 1( ) 
Aipid|] [| ip id 
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P TCP PSH PSH 
S S OL] TCP 11] Aseq th_seq 
A A oO TCP ( ) 10] Aack th_ack 
W OL] TCP 11] Awin th_win 
U 0 URG ( ) 
1 URG urgoff| th urg URG 
( 
) 
(Awin ) 
29-34 5 00 1[] 3 
0 
1 1-255 1 
3 0 256-65535 3 
0 3[] 16 bit urgoff] Awin[] Aipid 
32 bit Aack|] Aseq 0 65535 
29-33 29-34 
« IP 
. IP 16 bit[] IP IP 
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29.13.3 
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( 4 10110 1111) 
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20-3 | 
29.13.4 DI 
1-17 bsdi[] slip SLIP 
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A) Ü 
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bsdill slip 
(FTP) 29-36 
DU aut FTP 
UH D 0 DO DO DU 
UNCOMPRESSED_TCP 3 2 2 3 
COMPRESSED_TCP 
0000 *sa 75 75 0 0 
0000 *s 25 1 1 325 
uuu 9 93 337 13 
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029-36 QOOUU FTPO0000000000000000 
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325 
FTP] [] IP 0 10 4 SYN ule FIN 
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UNCOMPRESSED_TCP ID 
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29-37 4 3.1 
4.1[] 6.0[] 3.3 40 
FTP 6 325 
256[] Aack 256 255 3 SLIPMTU 296 
TCP 256[] MSS FTP 3 250 
* S ( ) 256 *S 
TCP FTP 78 
4 IP ( 29.8) 
29.13.5 
SLIP[] PPP SLIP 
ifconfig 
linkO[] link2 ( ) 
( ) 
TCP UNCOMPRESSED TCP ID 
( ) 
PPP 
29.14 DUO 
TCP SYN RCVD 
ACK 
TCP ACK 
Net/3 
ACK ACK 
TCP 
URG TCP 
TCP URG 
TCP TCP_REASS 
FIN tcp_output 
TCP SLIP[] PPP IP[] TCP 40 
3-6 ( ) 



















































































































































































































































































































































































































































































804 


U U 


29.6 


29.7 
29.8 
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TCP/IP [ 2 
Net/3[] OM u SYN L U 500 d U U 
50 | SYN/ACK 
EIN L L 
Net/3 0 SYND l] SYN/ACK LU 500] u 
FIN TCP 
1 18-19[] RFC 793 14 4 
0 O Neu? u U U UU Net/3 0 
= 00006 BE w - = =: 
uu FIN 0000 FIN utut 
RFC 793[] 72 Ë 
( ‘OK’ )” 
Net/3[] [| 
RFC 1323 TCP 
Net/3[] IP TCP MONE 
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U 300 TOPHUUUO 


30.1 [Il 


0000 TePO 00000000 tepusrres 000000 pr usrreqt 00000 
U U 00 TCP 0000000000000000 tep_etloutputl LU DD tt 
setsockopt| TCP [| [] 























































































































30.2 tcp_usrreq[] |] 











































































































TCPD D U D D D 0 D 0 U D 00 D U U 0 30-1000 tep sr reda) UD U U U 0 D 
U U switch U D D U 0 0 0 DD U 0 0 DDD U U 15170 0000000000000 
nnnnpmnnnnnnnn 

"em tcp usrreq.c 


46 tcp usrreq(so, req, m, nam, control) 
47 struct socket *so; 


48 int req; 

49 struct mbuf *m, *nam, *control; 

50 I 

51 struct inpcb *inp; 

52 struct tcpcb *tp; 

53 int s; 

54 int error = 0; 

55 int ostate; 

56 if (req == PRU_CONTROL) 

57 return (in_control(so, (int) m, (caddr_t) nam, 

58 (struct ifnet *) control)); 

59 if (control && control->m_len) ( 

60 m freem(control); 

61 if (m) 

62 m freem(m); 

63 return (EINVAL); 

64 } 

65 s = splnet (); 

66 inp = sotoinpcb (so); 

67 ja 

68 * When a TCP is attached to a socket, then there will be 
69 * a (struct inpcb) pointed at by the socket, and this- 
70 * structure will point at a subsidary (struct tcpcb). 
71 */ 

72 if (inp == 0 && req != PRU ATTACH) ( 

73 splx(s); 

74 return (EINVAL); /* XXX */ 

75 } 

76 if (inp) { 

77 tp = intotcpcb(inp); 


U 30-1 tcp usrreq DUU 


806 zero 02000 China-pupco 


78 /* WHAT IF TP IS 0? */ 
79 ostate = tp->t_state; 
80 } else 

8i ostate = 0; 


82 switch (req) { 















































































































































































































































































































= 


276 default: 





277 panic("tcp usrreq"); 

278 } 

279 if (tp && (so->so_options & SO DEBUG)) 

280 top trace(TA USER, ostate, tp, (struct tcpiphdr *) 0, req); 
281 splx(s); 

282 return (error); 

283 3 





tcp_usrreq.c 
0 30-1 (0) 


l. in control ]l ioct1] 0 
45-58 PRU_CONTROL[ | 000 ioct10 000000 in control 00000000 

2. 000000 
59-64 000000 sendmsgf I TCP AO D 0 D D 0 D 0 0 D 0 D U mbut O00 
EINVAL[][] D 0 0 C] C] 0000000 
65-66 Q00000 spinet 00000000000 D 0 0 D 00 D D 0 0 0 D 0 0 U 
OOOOU0 cas DD 0 DUDU splnetQ 0000 23-15 0 D D O DD spinet J D 
U D D 0 0 DD D 0 0 0000 DDD DD 0 0 IP DDD (000000 tep_input)OD 
OOOOO0000000000000000P0000000 

U U DD D 0 0000 00 DDD 0 D Internet PBYOOOOOOOOOOOO 
socket 0 00000 PRU_ATTACHU 0 D D B D 0 D D D D LI U 
67-81 00 inPd 000000000000 ostate 0 D 0 0 D 0 D 0 D 0 0 D U 
tcp trace] 

U D D 0000 case 0 0 DD 000 socket] DD D 0 D D DI D 0 D 
000000 (0128-70 0 O sonewconn 0000000 PRU_ATTACHO 000 30-20 O 
U U DD 0 00000 U 


aaa ICH usrreg.c 


83 /* 

84 * TCP attaches to socket via PRU ATTACH, reserving space, 
85 * and an internet control block. 
86 */ 

87 Case PRU ATTACH: 

88 if (inp) ( 

89 error - EISCONN; 

90 break; 

91 } 

92 error = tcp_attach(so); 

93 if (error) 


[] 30-2 tcp usrreq [|] [| [| PRU ATTACH [] PRU DETACH [] JJ 
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94 break; 
95 if ((so-»so options & SO LINGER) && so->so_linger == 0) 
96 so->so_linger = TCP_LINGERTIME; 
97 tp = sototcpcb (so); 
98 break; 
99 /* 
100 * PRU DETACH detaches the TCP protocol from the socket. 
101 * If the protocol state is non-embryonic, then can't 
102 * do this directly: have to initiate a PRU DISCONNECT, 
103 * which may finish later; embryonic TCB's can just 
104 * be discarded here. 
105 ES 
106 case PRU_DETACH: 
107 if (tp->t_state > TCPS_LISTEN) 
108 tp = tcp_disconnect (tp); 
109 else 
110 tp = tcp close(tp); 
111 break; 
IT — — — — cp, usrreg.c 
DU 30-2 (J) 
3. PRU ATTACH 
83-94 | | PCB | D EISCONN tcp_attach 
Internet PCB[] TCP 
95-96 SO LINGER 0 120 
(TCP LINGERTIME) 
PRU ATTACH 
socket | | sonewconn PRU ATTACH 
so options PRU ATTACH 
O[] SO LINGER 
TCP LINGERTIME[| tcp timer.h 
120 d 2 Ñ SO LINGER tsleep 
(|| soclose ) timeout 
(hz) 100 1.2 
2 
97 tp TCP SO_DEBUG 




























































































































































































4. PRU_DETACH 

















































































































































































































































































































































































































































































































































































































99-111 close PRU_DISCONNECT PRU_DETACH 
( ESTABLISHED) 
tcp_disconnect TCP ( 
FIN) 
xf LISTEN 
SYN SENT SYN RCVD| LISTEN tcp disconnect 
tcp close case tcp disconnect 
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30-3 bind[] listen 
tcp_usrreq.c 
112 /* 
113 * Give the socket an address. 
114 */ 
115 case PRU, BIND: 
116 error = in pcbbind(inp, nam); 
117 if (error) 
118 break; 
119 break; 
120 FE I 
121 * Prepare to accept connections. 
122 */ 
123 case PRU LISTEN: 
124 if (inp->inp lport == 0) 
125 error = in_pcbbind(inp, (struct mbuf *) 0); 
126 if (error == 0) 
127 tp->t state = TCPS LISTEN; 
128 break; ep usrreg.c 
O 30-3 tcp usrreg U [| [| PRU BIND [| PRU LISTEN [0 
112-119 PRU BIND in pcbbind 
120-128 PRU LISTEN 
in pcbbind 
RPC( ) Port Mapper 
(U 1] 29.4 Port Mapper) LISTEN listen 
( ) 
30-4 connect 
























































































































































dog 2 ep usrreq.c 


129 /* 

130 * Initiate connection to peer. 

131 * Create a template for use in transmissions on this connection. 
132 * Enter SYN SENT state, and mark socket as connecting. 
133 * Start keepalive timer, and seed output sequence space. 
134 * Send initial segment on connection. 

135 */ 

136 case PRU CONNECT: 

137 if (inp->inp_lport == 0) { 

138 error = in pcbbind(inp, (struct mbuf *) 0); 

139 if (error) 

140 break; 

141 ) 

142 error = in pcbconnect(inp, nam); 

143 if (error) 

144 break; 

145 tp->t template = tcp template(tp); 

146 if (tp->t template == 0) ( 

147 in_pcbdisconnect (inp); 


error = ENOBUFS; 


O 30-4 tcp usrreg U [| [| PRU CONNECT DI 
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149 break; 
150 } 
151 ./* Compute window scaling to request. */ 
152 while (tp-»request r scale « TCP MAX WINSHIFT && 
153 (TCP MAXWIN << tp->request r scale) « so->so_rcv.sb_hiwat) 
154 tp->request r scale++: 
155 soisconnecting (so); 
156 tcpstat.tcps_connattempt++; 
157 tp->t_state = TCPS_SYN_SENT; 
158 tp->t_timer[TCPT_KEEP] = TCPTV_KEEP_INIT; 
159 tp->iss = tcp_iss; 
160 tcp iss += TCP_ISSINCR / 2; 
161 tcp_sendseginit (tp); 
162 error = tcp_output (tp); 
163 break; 
tcp usrreq.c 
D 30-4 (0) 
5. 
129-141 ip_pcbbind 
6. PCB 
142-144 in_pcbconnect 
yA IP[] TCP 
145-150 tcp_template mbu IP[] TCP 
mbu 
8. 
151-154 65535(TCP_MAXWIN) 
(so_rcv.sb_hiwat) (0-14 ) SYN 
(U 28-7 ) connect 
SO_RCVBUF TCP SYN | 
(U 24-3 tcp_recvspace) 
9. 
153-138 soisconnecting TCP 
SYN_SENT tcp_output SYN( 24-16[] tcp_outlagsl] ) 
75 tcp output SYN 25-16 
10. 
159-161 tcp_iss tcp_iss 64 000 
(TCP ISSINCR 2) SYN ISSO ( 28-17) tcp iss 
tcp sendseqinit 
11. SYN 
162 tcp output SYN tcp output ( mbuf 
) tcp usrreq 
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30-5 PRU_CONNECT2|| PRU_DISCONNECT|| PRU ACCEPT U U U 
164-169 PRU_CONNECT2 socketpair TCP 
170-183 close [| PRU_DISCONNECT| o | o 
tcp disconnect FIN O TCP 
tcp. usrreg.c 

164 /* p- q 

165 * Create a TCP connection between two sockets. 

166 */ 

167 case PRU_CONNECT2: 

168 error = EOPNOTSUPP; 

169 break; 

170 /* 

171 * Initiate disconnect from peer. 

172 * If connection never passed embryonic stage, just drop; 

173 * else if don't need to let data drain, then can just drop anyway, 

174 * else have to begin TCP shutdown process: mark socket disconnecting, 

175 * drain unread data, state switch to reflect user close, and 

176 * send segment (e.g. FIN) to peer. Socket will be really disconnectec 

177 * when peer sends FIN and acks ours. 

178 k 

179 * SHOULD IMPLEMENT LATER PRU CONNECT VIA REALLOC TCPCB. 

180 */ 

181 case PRU_DISCONNECT: 

182 tp = tcp disconnect (tp); 

183 break; 

184 /* 

185 * Accept a connection. Essentially all the work is 

186 * done at higher levels; just return the address 

187 * of the peer, storing through addr. 

188 */ 

189 case PRU_ACCEPT: 

190 in_setpeeraddr (inp, nam); 

191 break; 

tcp_usrreq.c 
O 30-5. tcp usrreg [ [| [| PRU CONNECT2 [| PRU DISCONNECT [| PRU ACCEPT UI 
“ [] ” L 
connect 
connect | | socket utu 
connect[] 
184-191 accept[] | | | PRU_ACCEPT 
0000000 IP | i 
30-6 | [| PRU_SHUTDOWN[] PRU. RCVD[] PRU. SEND 
12. PRU. SHUTDOWN[] 
















































































































































































































































































192-200 | shutdown] |] g soshutdown 
PRU_SHUTDOWN socantsendmore | | | 
tcp usrclosed 24-15 tcp output 
FIN 
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tcp_usrreq.c 
192 LE RN 1 
193 * Mark the connection as being incapable of further output. 
194 */ 
195 case PRU_SHUTDOWN: 
196 socantsendmore (so); 
197 tp = tep_usrclosed(tp); 
198 if (tp) 
199 error = tcp output (tp); 
200 break; 
201 /* 
202 * After a receive, possibly send window update to peer. 
203 */ 
204 case PRU_RCVD: 
205 (void) tcp output (tp); 
206 break; 
207 /* 
208 * Do a send by putting data in output queue and updating urgent 
209 * marker if URG set. Possibly send more data. 
210 *7 E 
211 case PRU SEND: 
212 sbappend (&so->so_snd, M); 
213 error = tcp output (tp); 
214 break; 
tcp usrreq.c 
O 30-6 tcp usrreq [][][] PRU SHUTDOWN [| PRU RCVD [| PRU SEND [] [J 
13. PRU. RCVD 
201-206 Soreceive 
TCP tcp output 
14. PRU. SEND 
207-214 23-14 5 sbappend 
( ) tcp output 
( ) 
30-7 PRU_ABORT|| PRU SENSE 
215 7 tcp. usrreg.c 
216 * Abort the TCP. 
217 */ å 
218 case PRU ABORT: 
219 tp = tcp drop(tp, ECONNABORTED) ; 
220 break; 
221 case PRU SENSE: 
222 ((struct stat *) m)->st blksize = so->so snd.sb hiwat; 
223 (void) splx(s); 
224 return (0); 
tcp_usrreq.c 








[] 30-7 tcp usrreq [|] J] [| PRU ABORT [| PRU SENSE [| [| 











15. PRU ABORT 
215-220 ( ) 
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TCP/IP 2 
SYN accept soclose 
PRU_ABORT tcp_drop RST 
16. PRU_SENSE 
221-224 fstat PRU_SENSE TCP 
stat st_blksize 
30-8 PRU_RCVOOB MSG_OOB 
soreceive 
tcp_usrreq.c 
225 case PRU_RCVOOB: P- 1 
226 if ((so->so_oobmark == 0 && 
227 (so->so_state K SS RCVATMARK) == 0) [| 
228 So-»so options & SO OOBINLINE || 
229 tp->t_oobflags & TCPOOB HADDATA) ( 
230 error = EINVAL; 
231 break; 
232 } 
233 if ((tp->t_oobflags & TCPOOB_HAVEDATA) == 0) { 
234 error = EWOULDBLOCK; 
235 break; 
236 } 
237 m->m len = 1; 
238 *mtod(m, caddr_t) = tp->t_iobc; 
239 if (((int) nam & MSG PEEK) == 0) 
240 tp->t oobflags “= (TCPOOB HAVEDATA | TCPOOB HADDATA) ; 
241 break; 
tcp usrreg.c 
O 30-8 tcp usrreq [ U [| PRU RcvooB [] [J 
17. 
225-232 3 
1) (so oobmark) 0 SS RCVATMARK 
2) SO OOBINLINE 
3) TCPOOB HADDATA ( ) 
3 EINVAL 
18. 
233-236 3 TCPOOB HAVEDATA TCP 
1 (O 29-17) 
EWOULDBLOCK 
1 26-7 
19. 
237-238 tcp pulloutofband t_iobc 
20. 
239-241 ( MSG PEEK 
)[] TCP HAVE HAD case 
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HAVE HAD HAD 
HAD (U 29-17) 
tp->t oobflags = TCPOOB HADDATA; 
t oobflags Net/3 
30-9 PRU SENDOOB MSG OOB sosend 
tcp_usrreq.c 
242 case PRU_SENDOOB: 
243 if (sbspace(&so->so snd) < -512) { 
244 m freem(m); 
245 error - ENOBUFS; 
246 break; 
247 } 
248 /* 
249 * According to RFC961 (Assigned Protocols), 
250 * the urgent pointer points to the last octet 
251 * of urgent data. We continue, however, 
252 * to consider it to indicate the first octet 
253 * of data past the urgent section. 
254 * Otherwise, snd up should be one lower. 
255 */ 
256 sbappend (£so->so_snd, m); 
257 tp->snd_up = tp->snd_una + so->so_snd.sb_cc; 
258 tp->t_force = 1; 
259 error = tcp_output (tp); 
260 tp->t_force = 0; 
261 break; 
tcp usrreq.c 
O 30-9 tcp usrreg [] [| [| PRU sENbooB DI 
21. 
242-247 
512 
1024 ([] 16-24) sbappend 
22. 
248-257 (snd, up) 26-30 
3 MSG OOB 
MSG OOB 1 
23. TCP 
258-261 t force 1 tcp output TCP 
URG 1 26-7 
30-10 3 
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tcp_usrreg.c 

262 case PRU_SOCKADDR: SS 1 

263 in_setsockaddr (inp, nam); 

264 break; : 

265 case PRU_PEERADDR: 

266 in_setpeeraddr(inp, nam); 

267 break; 

268 /* 

269 * TCP slow timer went off; going through this 

270 * routine for tracing's sake. 

271 */ 

272 case PRU, SLOWTIMO: 

273 tp - tcp timers(tp, (int) nam); 

274 req |- (int) nam << 8; /* for debug's sake */ 

275 break; 

tcp usrreg.c 
O 30-10 tcp usrreq [][] [| PRU SOCKADDR [| PRU PEERADDR [| PRU_SLOWTIMO [0 
262-267 getsocknamell getpeername PRU_SOCKADDR 
PRU_PEERADDR in setsockaddr[| in_setpeeraddr PCB 
addr 
268-275 tcp_slowtimo PRU_SLOWTIMO U 0 
tcep_slowtimol|] |] tcp timers 
tcp trace ([] 30-1) 4[] TCP 
tcp_slowtimo nam t_timer (U 25-1) 8 
(req) trpt 



















































































































































































30.3 tcp_attach|[| |] 

























































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































tcp_attach PRU_ATTACH ( 
) tcp_usrreq 30-11 
1. 
361-372 sbreserve 8192 
tcp sendspace[] tcp recvspace ([] 24-3) 
MSS MTU 
[Comer and lin 1994] 3 MSS 
O O O 61 444 U 
MTU([] FDDI[] ATM) 
2: Internet PCB[] TCP 
373-377 in pcballoc Internet PCB tcp_newtcpcb TCP[] [| 0 
PCB 
378-384 tcp_newtcpcb malloc " XXX" 
PRU ATTACH 0 (sonewconn) 
| | SS_NOFDREF in pcballoc[] 
sofree | tcp input 0 
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([] 29-27 dropsocket ) 
in pcbdetach SS NOFDREF nofd 
tcp attach 
385-386 TCP CLOSED 
tcp usrreg.c 
361 int We q 
362 tcp_attach(so) 
363 struct socket *so; 
364 { 
365 struct tcpcb *tp; 
366 struct inpcb *inp; 
367 int error; 
368 if (so->so_snd.sb_hiwat == 0 || so->so rcv.sb hiwat == 0) { 
369 error = soreserve(so, tcp_sendspace, tcp_recvspace); 
370 if (error) 
371 return (error); 
372 } 
373 error = in_pcballoc(so, £tcb); 
374 if (error) 
375 return (error); 
376 inp = sotoinpcb (so); 
377 tp = tcp newtcpcb(inp); 
378 if (tp == 0) ( 
379 int nofd = so-»so state € SS NOFDREF; /* XXX */ 
380 SO-»80 state &= ~SS_NOFDREF; /* don't free the socket yet */ 
381 in pcbdetach(inp); 
382 so->so state |= nofd; 
383 return (ENOBUFS); 
384 } 
385 tp->t_state = TCPS_CLOSED; 
386 return (0); 
387 > 
tep usrreg.c 
0 30-11 tcp attach 0000000 TCP|[J [] 
30.4 tcp_disconnect|] [| 
30-12 tcp_disconnect TCP 
1. Ú 
396-402 ESTABLISHED (O LISTEN[] SYN SENT[] SYN. RCVD) 
tcp_close PCB[] TCP 
2. 
403-404 SO_LINGER (SO_LINGER) 
tcp_drop TIME_WAIT CLOSED 
RST PCB[] TCP close PRU_DISCONNECT 
SO_LINGER soclose 
3. 
405-406 SO LINGER 































































































































































































816 
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TCP/IP 2 
TCP soisdisconnecting 
396 struct tcpcb + tcp usrreg.c 
397 tcp disconnect (tp) 
398 struct tcpcb *tp; 
399 ( 
400 struct socket *so = tp-»t inpcb-»inp socket; 
401 if (tp-»t state < TCPS ESTABLISHED) 
402 tp - tcp close(tp); 
403 else if ((so-»so options & SO LINGER) && so-»so linger == 0) 
404 tp - tcp drop(tp, 0); 
405 else ( 
406 soisdisconnecting (so); 
407 sbflush(&so-»so rcv) n 
408 tp - tcp usrclosed(tp); 
409 if (tp) 
410 (void) tcp output (tp); 
411 H 
412 return (tp); 
413 ) 
tcp usrreq.c 
U 30-12 tcp discomect 0000000 TCPO DO 
4. 
407 sbflush 
tcp output Ñ N 
TCP 
TCP ( ) 
5. 
408-410 tcp_usrclosed 
FIN WAIT 1 ESTABLIDHED 
tcp usrclosed (tp) 
tcp output ESTABLISHED 
FIN WAIT 2 FIN 
30.5 tcp usrclosed[] [] 
30-13 PRU, SHUTDOWN tcp disconnect 
1. SYN 
429-434 SYN FIN CLOSED 
tcp close Internet PCB[] TCP 
2. FIN WAIT 1 
435-438 SYN RCVD[] ESTABLISHED 
FIN. WAIT 1 | [| tcp. output[] FIN([] 24-16[] [| tcp. outflags[] ) 
3. LAST ACK 
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439-441 CLOSE_WAIT LAST_ACK 
tcp output FIN 
443-444 FIN WAIT 2[] TIME WAIT[] soisdisconnected 
| | U 
tep usrreg.c 


424 struct tcpcb * 
425 tcp_usrclosed(tp) 
426 struct tcpcb *tp; 


427 I 

428 switch (tp->t state) { 

429 case TCPS CLOSED: 

430 case TCPS LISTEN: 

431 case TCPS SYN SENT: 

432 tp->t state = TCPS CLOSED; 

433 tp = tcp close(tp); 

434 break; 

435 case TCPS SYN RECEIVED: 

436 case TCPS ESTABLISHED: 

437 tp-»t state - TCPS, FIN WAIT 1; 

438 break; 

439 case TCPS CLOSE WAIT: 

440 tp->t state = TCPS LAST ACK; 

441 break; 

442 } 

443 if (tp && tp->t_state >= TCPS_FIN_WAIT_2) 
444 soisdisconnected (tp->t_inpcb->inp_socket); 
445 return (tp); 

446 } 





tcp_usrreq.c 


0 30-13 tcp usrclosed JPD00000000000000000000000 


30.6 tcp ctloutput[] [| 

















































































































































































































































































































tcp ctloutput getsockopt|| setsockopt 
TCP level SOL SOCKET 30-14 TCP 
I 0 U U [] I DU U [] 
TCP NODELAY t flags DDD Nagel] [ (O 26-8) 
TCP_MAXSEG t_maxseg [Ut TCPH 0000000000 




















0 30-14 TCP D 0 0 0 0 D 



















































































30-15 
TREE top usrreg.c 
285 tcp_ctloutput (op, so, level, optname, mp) 
286 int op; 
287 struct socket *so; 
288 int level, optname; 


DH 30-15 tcp_ctloutput 0000000 


618 
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TCP/IP 2 
289 struct mbuf **mp; 
290 { 
291 int error = 0, s; 
292 struct inpcb *inp; 
293 struct tcpcb *tp; 
294 struct mbuf *m; 
295 int i; 
296 s = splnet(); 
297 inp = sotoinpcb (so); 
298 if (inp == NULL) { 
299 splx(s); 
300 if (op == PRCO_SETOPT && *mp) 
301 (void) m free(*mp); 
302 return (ECONNRESET); 
303 } 
304 if (level != IPPROTO_TCP) { 
305 error = ip_ctloutput (op, so, level, optname, mp); 
306 splx(s); 
307 return (error); 
308 } 
309 tp = intotcpcb(inp); 
tcp_usrreq.c 
O 30-15 (O) 
296-303 splnet[] inp Internet PCB inp 
mbuf| 
304-308 level(getsockopt[] setsockopt | ) 
IPPROTO TCP (O IP) TCP IP 
IP TCP[] ip ctloutput 
309 TCP tp TCP 
switch PRCO SETOPT([] 30-16[] 
) PRCO GETOPT([] 30-17 ) 
tcp usrreg.c 
310 switch (op) { ER 4 
311 case PRCO_SETOPT: 
312 m = *mp; 
313 switch (optname) { 
314 case TCP_NODELAY: 
315 if (m == NULL || m->m len < sizeof(int)) 
316 error = EINVAL; 
317 else if (*mtod(m, int *)) 
318 tp->t flags |= TF NODELAY; 
319 else 
320 tp->t flags &= ~TF_NODELAY; 
321 break; i 
322 case TCP_MAXSEG: 
323 if (m && (i = *mtod(m, int *)) > 0 && i <= tp->t_maxseg) 
324 tp->t_maxseg = i; 
325 else 
326 error = EINVAL; 
327 break; 


D 30-16 tcp ctlouteet 000000000 
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328 default: 
329 error = ENOPROTOOPT; 
330 break; 
331 } 
332 if (m) 
333 (void) m free (m); 
334 break; 
tcp usrreg.c 
D 30-16 (0) 
315-316 m mbuf | setsockopt g 0 TCPO [| 
mbuf mbuf mbu 
1. TCP_NODELAY 
317=321 TF NODELAY 26-8 Negal 
0 Negal ( ) TF NODELAY 
2. TCP MAXSEG 
322-327 | O O MSS[] TCP | tcp. newtcpcb t maxseg 
512 SYNU U [| [| MSS tcp input tcp mss[] t maxseg 
MTU( 40 IP[] TCP ) 1460 
512 MSS 
tcp_mss | U MSS 
4.4BSD MSS 
getsockopt MSS 
3. mbuf 
332-333 mbu 
30-17 PRCO GETOPT 
tcp, usrreq. 
335 case PRCO GETOPT: nis d 
336 *mp = m = m get (M WAIT, MT SOOPTS); 
337 m->m len = sizeof(int); 
338 switch (optname) ( 
339 case TCP NODELAY: 
340 *mtod(m, int *) - tp-»t flags & TF NODELAY; 
341 break; 
342 case TCP MAXSEG: 
343 *mtod(m, int *) - tp-»t maxseg; 
344 break; 
345 default: 
346 error - ENOPROTOOPT; 
347 break; 
348 } 
349 break; 
350 } 
351 splx(s); 
352 return (error); 
353 } 
tcp usrreg.c 





D 30-17 tcp ctloutput 000000000 


820 c 
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2 
335=337 TCP m_get 
mbu 
339-341 TCP NODELAY TF NODELAY ( Nagel 
Ou 0 TF_NODELAY 
342-344 TCP_MAXSEG t_maxseg PRCO_SETOPT 
30.7 00 
tcp_usrreg PRU. xxx 
TCP 
tcp_ctlsockopt 0 0 TCP[] 0 Nagel 
U U 
30.1 TCP | socket 
connect write ( JU read ) 
TCP 
30.2 SO LINGER 0 close 
tcp disconnect RST 
0 (kill) close 
RST 
30.3 25-4 TCP_LINGERTIME " SO LINGER = 
30-2 | 
30.4 Net/3 socket[] connect 
1 129 
30.5 1 C sock 
(-p) 
tcpdump TCP“ 0 i 
ACK ACK 
30.6 SO KEEPALIVE 
30.7 RFC 1122 TCP RST Net/3 























































































































































































































ipsu tt 


0310 BPFOBSDO 0 0 0 0 U 






























































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































31.1 HH 
BSD (BPF) | | | 
= N /dev/bpf0]] /dev/bp£10 0 BPF 
BPF 
BPF 8192 BPF 
open EBUSY BPF 
open 
ioctl BPF 
BPF 
“ ” “ ” BPF 
BPF BPF 3 SLIP 
bpfattach BPF 
BPF 
BPF 1 A tcpdump 
TCP BPF 
BPF 
bpf(4)[] [McCanne and Jacobson 1993] 
31.2 FOND 
BPF C 31-1 
U [] [] Ë 
net/bpf.h BPF[] [] 
net/bpfdesc.h BPF[] D 
net/bpf.c BPF[] D D 
031-1 [000000 
31.2.1 UD 
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bpf_bufsize 





int 








TCP/IP 2 
0 H DU D 0 0 p 0 
bpf_iflist struct bpf_if * OO BPOOOOOOOO 
bpf dtab struct bpf_d [] BPH[] D 0 0 


BP D D 0 0 D DÚ 











0312 00000000 






































































































































































































































31:22 DAG 
31-3 bpf d BPF 
bpf I 000 U [] 
bd rcount O000000000000 
bd dcount O0000000000000000 
D3? JO000000 
BB 4000 
« BPF 
« BPF 
« BPF 
« BPF 















































31.3 bp£ if[][] 

























































































































































































































































































































































































































































































































































































































































































































































































































































































































































































BPF BPF bpf if 
bpf iflist 31-4 BPF 
esc.h 
67 struct bpf if ( bpfä 
68 struct bpf_if *bif_next; /* list of all interfaces */ 
69 struct bpf_d *bif dlist; /* descriptor list */ 
70 struct bpf_if **bif_driverp; /* pointer into softc */ 
71 u_int bif_dlt; /* link layer type */ 
72 u_int bif_hdrlen; /* length of header (with padding) */ 
73 struct ifnet *bif_ifp; /* correspoding interface */ 
74 Y; 
bpfdesc.h 
0 31-4 bp£ if OD 
67-79 bif next BPF bif dlist 
BPF 
70 BPF bif driverp ifnet 
bpf if *pif driverp 
BPF *bif driverp bif if BPF 
7 bif dltl] [] 31-5 | 0 
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31 BPF[] BSD 



















































































































































































































































































































































































































































































































































































































































































































































































































































































































































































bif dlt U Ë 
DLT_EN10MB MO 0000 
DLT SLIP SLIP] [| 
DLT NULL 0000 
031-5 bir alt [J] 
72-74 BPF BPF bif_hdrlen 
bif ifp ifnet 
31-6 bpf hdr 
122 struct bpf_här { bpf.h 
123 struct timeval bh tstamp; /* time stamp */ 
124 u long bh caplen; /* length of captured portion */ 
125 u_long bh datalen; /* original length of packet */ 
126 u short bh hdrlen; /* length of bpf header (this struct plus 
127 alignment padding) */ 
128 }; 
bpf.h 
[] 31-6 bpf har [] [J 
122-128 bh tstamp bh caplen BPF 
bh datalen bh headlen bpf hdr 
BPF bif hdrlen 
31-7 bpf if 3 (le. softc [0][] sl softc[0] 
loif)[]] ifnet 
bpf iflist: 
bpf if() bpf_if{} bpf if() 
bif dlist bif dlist = 
B bif_dlt DLT SLIP | bif dit DLT NULL 
bif_härlen bif hdrlen |20 
le softc[0]: 








D 31-7. bef if [] ifnet D D 































































































sc bpf 























if bpf 























bif driverp 





























SLIP BPF 

































































SLIP 


























if bpf 


























sc bpf 
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TCP/IP 2 
if_bpf ifnet Net/2 ifnet if_bpf 
bpfattach 3 
3 bpfattach SLIP 
bpfattach BPF 31-8 
1053 void bpf.c 


1054 bpfattach(driverp, ifp, dlt, hdrlen) 
1055 caddr_t *driverp; 

1056 struct ifnet *ifp; 

1057 u_int dit, hdrlen; 


































































































































































































































































































































































































































































































1058 { 
1059 struct bpf_if *bp; 
1060 int i; 
1061 bp = (struct bpf if +) malloc(sizeof(*bp), M DEVBUF, M DONTWAIT); 
1062 if (bp -- 0) 
1063 panic("bpfattach"); 
1064 bp->bif_dlist = 0; 
1065 bp->bif_driverp = (struct bpf_if **) driverp; 
1066 bp->bif_ifp = ifp; i 
1067 bp->bif_dlt = dlt; 
1068 bp->bif nezt = bpf_iflist; 
1069 bpf_iflist = bp; 
1070 *bp->bif_driverp = 0; 
1071 /* 
1072 * Compute the length of the bpf header. This is not necessarily 
1073 * equal to SIZEOF BPF HDR because we want to insert spacing such 
1074 * that the network layer header begins on a longword boundary (for 
1075 * performance reasons and to alleviate alignment restrictions). 
1076 */ 
1077 bp->bif_hdrlen = BPF WORDALIGN(hdrlen + SIZEOF,.BPF HDR) - harlen: 
1078 /* 
1079 * Mark all the descriptors free if this hasn't been done. 
1080 */ ` 
1081 if (!D ISFREE(&bpf dtab[0])) 
1082 for (i = 0; i < NBPFILTER; ++i) 
1083 D MARKFREE (&bpf dtab[il); 
1084 printf("bpf: %s%d attached\n", ifp->if name, ifp->if unit); 
1085 ) 
bpf.c 
O 31-8 bpfattach J [| 
1053-1063 BPF bpfattach 
bif driverp (U 31-4 ) ifnet 
bpf_if 
1. bpf-if 
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1064-1070 bpf if BPF 
bpf iflist 
2. BPF 
1071-1077 bif hdrlen (U IP ) 
BPF 31-9 3 
BPF 
180 0 140 0 
DO 
woes | mem — [ws 36] 
180 O 200 160 0 
DD 
O000000 





180 D 200 





m || TI  = 30 


400 


0 31-9 BPE ODO 

























































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































ether_header 4-10 SLIP 5-14 
5-28 
SLIP| 2 IP 4 
3. bpf dtab 
1078-1083 31-10 BPF 
bpfattach 
4. | 
1084-1085 BPF 
31.4 bp£ aj O 
BPF ictl 
BPF BPF 
bpf d 31-10 
45-46 BPF bpf d 
bd next 
47-52 bpf d bd sbuf ( 
) bd. £buf( ) 
bd hbuf( ) bd slen[] bd hlen 
















































































































































































626 


TCP/IP 

































































































































































45 struct bpf_d { 
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bpfdesc.h 

















































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































46 struct bpf_d *bd next; /* Linked list of descriptors */ 
47 caddr_t bd sbuf; /* store slot */ 
48 caddr t bd hbuf; /* hold slot */ 
49 caddr_t ba_fbuf; /* free slot */ 
50 int bd_slen; /* current length of store buffer */ 
51 int bd hlen; /* current length of hold buffer */ 
52 int bd_bufsize; /* absolute length of buffers */ 
53 struct bpf_if *bd_bif; /* interface descriptor */ 
54 u long bd rtout; /* Read timeout in 'ticks' */ 
55 struct bpf_insn “bd filter; /* filter code */ 
56 u long bd_rcount; /* number of packets received */ 
57 u long bd dcount; /* number of packets dropped */ 
58 u_char bd_promisc; /* true if listening promiscuously */ 
59 u_char bd state; /* idle, waiting, or timed out */ 
60 u_char bd_immediate; /* true to return on packet arrival */ 
61 u_char bd_pad; /* explicit alignment */ 
62 struct selinfo bd sel; /* bsd select info */ 
63 }; 
bpfdesc.h 
[] 31-10 bet a QQ 
bd hbuf bd sbuf 
bd fbuf ROTATE BUFFERS 
bd hbuf bd sbuf bd fbuf 
bd bufsize 4096(BPF BUFSIZE) 
BIOCSBLENoctl 
BPF bd bufsize[] BIOCGBLEN bd bufsize 
32768 (BPF MAXBUFSIZE) 32(BPF MINBUFSIZE) 
53-57 bd bif BPF bpf. if BIOCSETIF 
bd rtout bd filter BPF 
BIOCGSTATS bd rcount[]| bd dcount 
58-63 bd promisc BIOCPROMISC 
(promiscuous) bd state bd immediate BIOCIMMEDIATE 
bd pad bpf d 
bd sel selinfo select 
BPF select 16.13 select 
31.4.1 bpfopen 
open BPF bpfopen([] 31-11) 
256-263 BPF NBPFILTER 
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| NBPFILTER 0 ENXIOĻUUUUUUUUUUULU /dev/bpe£xl] [I 
NBPFILTER| O 




































































































































































































































































































































































































































































































































































































































































































































































bpf.c 
256 int rf 
257 bpfopen (dev, flag) 
258 dev t dev; 
259 int flag; 
260 { 
261 struct bpf_d *d; 
262 if (minor (dev) >= NBPFILTER) 
263 return (ENXIO); 
264 /* 
265 * Each minor can be opened by only one process. If the requested 
266 * minor is in use, return EBUSY. 
267 */ 
268 d = &bpf_dtab[minor (dev) ]; 
269 if (ID ISFREE(d)) 
270 return (EBUSY); 
271 /* Mark "free" and do most initialization. */ 
272 bzero((char *) d, sizeof(*d)); 
273 d->bd bufsize = bpf bufsize; 
274 return (0); 
275 T 
bpf.c 
[] 31-11 bpfopen [] U 
| bpf d 
264-275 | | | BPF bp£_al] O E 
EBUSY|[ O tepdume | DI | | | 0 0 
000000008 00-01 bpf dtab[] DU Í U U U 0 U 
31.4.2 bpfioctl[|| 
U O ioct1[] ut O 31-120 [] | BPF | ioctll]| 
31-13[] bpfioct ll | BIOCSETF[] BIOCSETIE| | 
| ioct1[]| Hl L 
0 U 00000 Oo U 0 U 
FIONREAD u_int bpfioctl 60000000000 0000 
BIOCGBLEN u_int bpfioctl 0000000 
BIOCSBLEN u_int bpfioctl 000000 
BIOCSETF struct bpf_program bpf_setf O O BPFO O 
BIOCFLUSH reset_d 00000 
BIOCPROMISC ifpromisc 00000 
BIOCGDLT u_int bpfioctl DO bif dit 
BIOCGETIF struct ifreq bpf_ifname 00000000 
BIOCSETIF struct ifreq bpf_setif 0000000090 
BIOCSRTIMEOUT struct timeval bpfioctl [| p” 000000 
BIOCGRTIMEOUT struct timeval bpfioctl 0 "0 "0000000 
BIOCGSTATS struct bpf_stat bpfioctl O O BPFO O O 
BIOCIMMEDIATE u_int bpfioctl 000000 
BIOCVERSION struct bpf_version bpfioctl O O BPH[] H J Ú 












































D 31-12 BPF iocı H 0 












































828 n n: China+pub.tom 
TT Aan | 


bpf.c 





501 int 
502 bpfioctl(dev, cmd, addr, flag) 
503 dev t dev; 


504 int cmd; 

505 caddr t addr; 

506 int flag; 

507 I 

508 struct bpf d *d = &bpf dtab [minor (dev)]; 

509 int 8, error = 0; 

510 switch (cmd) ( 

511 /* 

512 * Set link layer read filter. 

513 *f 

514 case BIOCSETF: 

515 error - bpf setf(d, (struct bpf program *) addr); 
516 break; 

517 /* 

518 * Set interface. 

519 */ 

520 case BIOCSETIF: 

521 error = bpf setif(d, (struct ifreq *) addr); 
522 break; 





668 default: 


669 error = EINVAL; 
670 break; 

671 } 

672 return (error); 


673 T 


al em A =: ee bpf.c 








































































































































































































































































































































































































































































































































































































































































































D 31-13 bpfioctl OO 
501-509 bpfopen bpf dtab bpf d 
switch/case BIOCSETE|| BIOCSETIF 
default 
510-522 bpf sert addr bpf setif 
bpf d bpf setf 
668-673 EINVAL 
31-14 bpf setif bpf d LANCE 
bif dlist bpf_dtab[0] 




















































































































bpf dtab[0] bd sbuf|| bd hbuf 








































































































































































































































































































































































































4096(bd bufsize) bd bif bpf if 
ifnet (Je softc[0] if bpf bpf if 4-19 4-11 
if bpf bpf tap BPF 
31-15 31-10 BPF 
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bpf_iflist: 





bp£ if() - 
bif next -|----- » JO Obpf if] O 
bif_driverp 
bif_dlt 
bif_hdrlen 
bif_ifp 




















le softc[0]: 
















bpf dtab[2][] 
bpf dtab[NBPFILTER-1] 





O 31-14 000000000 BPF[I D 


bpf iflist: 





bpf_ift} 
Sehe: =» [OC per if[ D 






bpf dtab: 














bpf dtab[2][] 
bpf dtab[NBPFILTER-1] 





03115 00000000000 BPFOD 


830 
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TCP/IP 2 
BPF bpf_dtab bpf_d 
bpf dtab[l] BPF bif dlist 
bpf dtab[l] bpf dtab[l].bd next bpf dtab[0] 
BPF 
31.4.3 bpf_setif 
bpf setif BPF 31-16 
Seen bpf.c 

721 static int 

722 bpf setif(d, ifr) 

723 struct bpf_d *d; 

724 struct ifreg *ifr; 

725 I 

726 struct bpf if *bp; 

727 char *cp; 

728 int unit, s, error; 

729 /* 

730 * Separate string into name part and unit number. Put a null 

731 * byte at the end of the name part, and compute the number. 

732 * If the a unit number is unspecified, the default is O, 

733 * as initialized above. XXX This should be common code. 

734 */ 

735 unit = 0; 

736 Cp = ifr-»ifr name; 

737 cp[sizeof(ifr-»ifr name) - 1] = "VO"; 

738 while (*cp++) { 

739 if (*cp >= '0’ && *cp <= "9") L 

740 unit = *cp - '0'; 

741 *cp++ = "VO"; 

742 while (*cp) 

743 unit = 10 * unit + *cp++ - "Di? 

744 break; 

745 ) 

746 ) 

747 /* 

748 * Look through attached interfaces for the named one. 

749 */ 

750 for (bp - bpf iflist; bp !- 0; bp - bp-»bif next) ( 

751 struct ifnet *ifp = bp->bif_ifp; 

752 if (ifp == || unit != ifp->if_unit 

753 il stremp(ifp->if name, ifr->ifr name) !- 0) 

754 continue; 

755 /* 

756 * We found the requested interface. 

757 * If it's not up, return an error. 

758 * Allocate the packet buffers if we need to. 

759 * If we're already attached to requested interface, 

760 * just flush the buffer. 

761 */ 

762 jf ((ifp->if_flags & IFF_UP) == 0) 

763 return (ENETDOWN) ; 


[] 31-16 bpf setif OQ 
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764 if (d->bd sbuf == 0) ( 
765 error = bpf allocbufs(d); 
766 if (error != 0) 
767 return (error); 
768 } 
769 s = splimp(); 
770 if (bp != d->bd bif) { 
771 if (d->bd_bif) 
772 /* 
773 * Detach if attached to something else. 
774 KL 
775 bpf detachd (d); 
776 bpf attachd(d, bp); 
777 ) 
778 reset d(d); 
779 splx(s); 
780 return (0); 
781 } 
782 /* Not found. */ 
783 return (ENXIO); 
784 ) 
bpf.c 
[ 31-16 (D) 
721-746 bpf setif ifreq (O 4-23) 
unit ifr name 4 " s11N0" 
" S1NONO" unit 1 
1. ifnet 
747-754 for BPF (pt iflist[]) ifreq 
755-768 ENETDOWN bpf_allocate 
bpf_d 
2. bpf_d 
769-777 BPF ifreg 
bpf_detachd ( ) bpf_attachd 
778-784 reset_d 0 
ENXIO 
31.4.4 bpf_attachd|] 
31-170] bpf_attachd BPF BPF 
bpf.c 





189 static void 

190 bpf attachd(d, bp) 
191 struct bpf_d *d; 
192 struct bpf if *bp; 


193 { 
194 /* . 
195 * Point d at bp, and add d to the interface's list of listeners. 


[] 31-17 eg attachd [] D 
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196 * Finally, point the driver’s bpf cookie at the interface so 
197 * jt will divert packets to bpf. 
198 */ ` 
199 d->bd bif = bp; 
200 d->bd nezt - bp->bif dlist; 
201 bp->bif_dlist = d; 
202 *bp->bif_driverp bp; 
TE A  — MÀ 
0 31-17 (0) 
189-203 bd_bif BPF bpf_d 
bpf_d BPF BPF 
BPF 
315 BPFD I D 
BPF read BPF 
BPF 
31.5.1 bpf tap 
4-11] LANCE bpf tap 
bpf tap 4-11 
bpf tap(le-»sc if.if bp buf, len + sizeof(struct ether header)); 
31-18 bpf tap 
| bpf.c 
869 void 
870 bpf_tap(arg, pkt, pktlen) 
871 caddr_t arg; 
872 u_char *pkt; 
873 u_int pktlen; 
874 { 
875 struct bpf_if *bp; 
876 struct bpf d *d; 
877 u int slen; 
878 /* 
879 * Note that the ipl does not have to be raised at this point. 
880 * The only problem that could arise here is that if two different 
881 * interfaces shared any data. This is not the case. 
882 */ 
883 bp - (struct bpf if *) arg; 
884 for (d = bp->bif dlist; d != 0; d = d->bd next) 
885 ++d->bd rcount; 
886 slen = bpf filter(d->bd filter, pkt, pktlen, pktlen); 
887 if (slen != 0) 
888 catchpacket(d, pkt, pktlen, slen, bcopy); 
889 } 
890 } 
bpf.c 





O 31-18 bpf tap OO 
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869-882 bpf_if bpfattach 
(1400 ) 
BPF 
883-890 for BPF 
bpf_filter catchpacket 
slen 0 bpf_tap 
BPF 
bpf_mtap BPF bpf_tap 
mbuf 

























































































































































































31.5.2 catchpacket[] 


























31-18 catchpacket 31-19 




































































































































































946 
947 
948 
949 
950 
951 
952 
953 
954 
955 
956 
957 
958 
959 
960 
961 
962 
963 
964 


965 
966 
967 
968 
969 
970 
971 
972 
973 
974 
975 
976 
977 
978 
979 
980 





bpf.c 


static void 
catchpacket (d, pkt, pktlen, snaplen, cpfn) 
struct bpf d *d; 
u char *pkt; 
u int pktlen, snaplen; 
void (*cpfn) (const void *, void *, u int); 
{ 
struct bpf_hdr *hp; 


int totlen, curlen; 
int hdrlen = d->bd_bif->bif_härlen; 
/* 


* Figure out how many bytes to move. If the packet is 
* greater or equal to the snapshot length, transfer that 
* much. Otherwise, transfer the whole packet (unless 
* we hit the buffer size limit). 
*/ 
totlen = hdrlen + min(snaplen, pktlen); 
if (totlen > d->bd_bufsize) 
totlen = d->bd_bufsize; 
/* 
* Round up the end of the previous packet to the next longword. 
SZ 
curlen = BPF WORDALIGN(d->bd slen); 
if (curlen + totlen > d->bd bufsize) { 
FE å 
* This packet will overflow the storage buffer. 
* Rotate the buffers if we can, then wakeup any 
* pending reads. 
*/ 
if (d->bd_fbuf == 0) ( 
/* 
* We haven't completed the previous read yet, 
* so drop the packet. 
* 
++d->bd_dcount; 


O 31-19 catchpacket UI 
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2 
981 return; 
982 } 
983 ROTATE BUFFERS (d); 
984 bpf wakeup (d); 
985 curlen - 0; 
986 ) else if (d->bd immediate) 
987 /* 
988 * Immediate mode is set. A packet arrived so any 
989 * reads should be woken up. 
990 Sp 
991 bpf_wakeup (d) ; 
992 £* 
993 * Append the bpf header. 
994 */ 
995 hp = (struct bpf hdr *) (d->bd_sbuf + curlen); 
996 microtime (&hp->bh_tstamp) ; i 
997 hp->bh_datalen = pktlen; 
998 hp->bh hdrlen = hdrlen; 
999 /* 
1000 * Copy the packet data into the store buffer and update its length. 
1001 */ 
1002 (*cpfn) (pkt, (u char *) hp + hdrlen, (hp->bh_caplen = totlen - härlen)); 
1003 d->bd_slen = curlen + totlen; 
1004 } 
bpf.c 
H 31-19 (O) 
946-955 catchpacket d BPF pkt 
pktlen snaplen 
cpfn pkt 
cptn bcopy mbuf|] (pkt mbu mbu 
cptn bpf mcopy 
956-964 catchpacket bpf_hdr 
Snap len pktlen bpf_hdr 
(bd_bufsize ) 
1. 
965-985 curlen 
( ) 
ROTATE BUFFERS bpf wakeu 
2. 
986-991 === 
3 BPF 
992-1004 (microtime) bpf_hdr cptf 
mbuf] bpf tab leread 
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03/0 BPFO BSDO ( D 























U U U 


31.5.3 bpfread[|[] 
































































































































































































































































































































































































































OM | BPF[] [] [| read] [| [| ppfread O 0 BIOCSRTIMEOUT[ O O BPF[] 
unu oo00*00”0000 select 0000000000 tepdume O00 
BIOCSRTIMEOUTJ [ 0 select 0000000000000000000000000 
000 BicoeeL.en 000000000000000000000 00000000 
OO0O00000000000000000 read O 000000 U U U U U 
U U BPE D 0000000 UO OO OD 31-200 bpfread[] 

344 int bpf.c 


345 bpfread(dev, uio) 
346 dev t dev; 
347 struct uio *uio; 


348 ( 
349 
350 
351 


352 
353 
354 
355 
356 
357 


358 
359 
360 
361 
362 
363 
364 
365 
366 
367 
368 
369 
370 
371 
372 
373 
374 
375 
376 
377 
378 
379 
380 
381 
382 
383 
384 
385 


struct bpf d *d = &bpf dtab[minor(dev)]; 


int error; 
int Si 
/* 


* Restrict application to use a buffer the same size as 
* as kernel buffers. 
*/ 
if (uio->uio_resid != d->bd_bufsize) 
return (EINVAL); 


s = splimp(); 
/* 
* If the hold buffer is empty, then do a timed sleep, which 
* ends when the timeout expires or when enough packets 
* have arrived to fill the store buffer. 
=) 
while (d->bd hbuf == 0) { 
if (d->bd_immediate && d->bd_slen != 0) { 
/* 
* A packet(s) either arrived since the previous 
* read or arrived while we were asleep. 
* Rotate the buffers and return what's here. 
*/ 
ROTATE BUFFERS (d); 
break; 
) 
error = tsleep((caddr t) d, PRINET | PCATCH, "bpf", d-»bd rtout); 
if (error == EINTR || error == ERESTART) { 
splx(s); 
return (error); 
} 
if (error == EWOULDBLOCK) { 
/* 
* On a timeout, return what's in the buffer, 
* which may be nothing. If there is something 
* in the store buffer, we can rotate the buffers. 
*/ 
if (d->bd hbuf) 


[] 31-20 bpfread J [] 


636 
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TCP/IP [l-2 
386 /* 
387 * We filled up the buffer in between 
388 * getting the timeout and arriving 
389 * here, so we don't need to rotate. 
390 */ 
391 break; 
392 if (d->bd_slen == 0) { 
393 splx(s); 
394 return (0); 
395 } < 
396 ROTATE_BUFFERS (d) ; 
397 break; 
398 ) 
399 } 
400 /* 
401 * At this point, we know we have something in the hold slot. 
402 */ 
403 splx(s); 
404 /* 
405 * Move data from hold buffer into user space. 
406 * We know the entire buffer is transferred since 
407 * we checked above that the read buffer is bpf_bufsize bytes. 
408 “7 
409 error = uiomove(d->bd hbuf, d->bd_hlen, UIO READ, uio); 
410 s = splimp(); 
411 d->bd fbuf = d->bd hbuf; 
412 d->bd hbuf = 0; 
413 d->bd hlen = 0; 
414 splx(s); 
415 return (error); 
416 3 
bpf.c 
1 31-20 (0) 
344-357 U bpf dtabl | |] BPF | U BPF 
EINVAL 
1. 
358-364 BPF 
while Hl u 
BPF | U ( 31.2) 
2: 
365=373 while 
3. 
374-384 |] 
LU U u LU 
EINTR|| ERESTART 
o ERESTART syscalll] 
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385-391 
Sr 
392-399 read 0 
tsleep while 
6. 
400-416 uiomove bd hlen 
uiomove 
uiomove bd hlen 
BPF bd butai zell 
31.6 BPFO [| Ü 
BPF 
(U 4-8) 
bpfwrite 
write 31-21 bpfwrite 
BPF 
C 
437 int bpf. 
438 bpfwrite (dev, uio) 
439 dev_t dev; 
440 struct uio *uio; 
441 { 
442 struct bpf_d *d = £bpf_dtab[minor (dev)]; 
443 struct ifnet *ifp; 
444 struct mbuf *m; 
445 int error, s; 
446 static struct sockaddr dst; 
447 int datlen; 
448 if (d->bd_bif == 0) 
449 return (ENXIO); 
450 ifp = d->bd_bif->bif_ifp; 
451 if (uio->uio resid == 0) 
452 return (0); 
453 error = bpf movein(uio, (int) d->bd bif->bif dlt, &m, &dst, &datlen); 
454 if (error) 
455 return (error); 
456 if (datlen > ifp->if mtu) 
457 return (EMSGSIZE); 
458 s = splnet (); 
459 error = (*ifp->if output) (ifp, m, &dst, (struct rtentry *) 0); 
460 splx(s); 


[| 31-21 bpfwrite JQ 
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461 /* 
462 * The driver frees the mbuf. 
463 */ 
464 return (error); 
465 } 
bpf.c 
[] 31-21 (0) 
JE 
437-449 BPF 
ENXIO 
2. [|] mbu 
450-457 write 0 OL] bpf_movein 
mbuf] bif dlt 
datlen dst sockaddr 
| AF UNSPEC mbuf] 
MTU EMSGSIZE 
3. 
458-465 ifnet if_output mbu 
if_output ether_output 
317 00 
BPF BPF L 
BPF 
BPF BPF 
read 
BPF BPF 0 0 
Net/3 
U U 
31.1 BPF catchpacket bpf_wakeup 
31.2 31-20 U BPF[] L L 31-11 
BPF 



















































































































































































31.3 BIOCSETIF BPF 























Ais 


us] pn n IP 
























































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































32.1 [I] 
Internet | SOCK RAW IP 
| 3 
1) ICMP[] IGMP 
Ping ICMP ICMP 
ICMP 
19.7 Net/3 
RTM_REDIRECT 
ICMP (0 10 9.60 ) 
ICMP 
IGMP IGMP 
2) IP 
UDP IP] UDP 
3) IP IP 
gated IP EGP[] HELLO[] OSPF 
IP 
IP 
32.2 JO 00 
32-1 C 5 IP 
0 U [] [] 
netinet/raw ip.c Hu pied gut 
0321 JO00000 
32-2 5 IP 
5 IP 
“ rip” 2 IP (Raw IP)" = (Routing Information Protocol)” 
RIP) 
32.2.1 g 


























4 32-3 
































































































































840 TCP/IP D 20 Chinapub.tom 
































getsockopt 
00000 SANAAA setsockopt 000000 








domaininit 








an 
0322 [0 POO0O00000000000 

















0 D 0000 | 0 D 

rawinpcb struct inpcb O O IPO Internet PB] [] O O 
ripsrc | struct sockaddr iM 000000000 IPO [|] 
rip_recvspace u_long 000000000000 819200 
rip sendspace u long O00000000000 819200 


032-3 200209000000 





3222 ID 




















OO PO ipstat O (0 839000 




















0000 32-4] 0 























ips_noprete 
ips_rawout O0000P00000 























D 32-4. ipstat D D D D D D D D odd 
8-60 000 SNMP[] [| [| ips_noprotol] | | D 8-5] OOOD | | 



























































































































































32.3 DD IPO protoswl] O 





















































































































































































































































O 00 inet sv 00000 | U IPQ inetsv] OOD 4 
O00 sock RAWD D I 

e IPPROTO ICMP(] DD DO 

* IPPROTO IGMP( 2) 

e IPPROTO RAW 255) 



































32 

















IP 

































































































































































































































































641 






























































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































° IP ( 0) 
ICMP[] IGMP (U 11-12 13-9) 
. [] (SOCK RAM] D (socket ) 
IPPROTO ICMP[] IPPROTO IGM IPPROTO RAW 
protosw 
. (SOCK RAW) 
pffindproto 0 IP 
1.8 | ip_protox DH IPPROTO_RAW 
32-5 
N O inetsw[3] U O 
pr_type SOCK_RAW [1 O D 
pr domain & inetdomain O O Internet] O O O IP 
pr_protocol IPPROTO RAW(255) NO E] IP D] D]. ip ll 0 
pr flags PR ATOMIC|PR ADDR U U 0 D 0 D 00 
pr input rip input U iP D D D OLD 
Pr output 0 DU D Ip 0 0 
pr ctlinput 0 OO Ip D 
pr_ctloutput rip_ctlinput O0O000000000 
pr usrreq rip usrreq OOO000000000 
pr init 0 OO Ip D 
pr_fasttimo 0 OO rood 
pr_slowtimo 0 O O IPO O Ú 
pr_drain 0 O O rood 
pr syseti 0 U D rood 
032-5 DO IP] protosw O [| 
3 rip rip_output 
IP rip_usrreq 
IP rip_init g 
IPPROTP_RAW | 
32-5 (ICMP[] IGMP) protosw 
IP 32-61) 4[] SOCK_RAW protosw 
protosw [— Sock RAW H 000 
00 IPPROTO_ICMP (1) | IPPROTO IGMP (2) U U ©) 
pr input icmp input igmp input rip input rip input 
pr_output rip. output rip output rip output rip output 


pr_ctloutput 
pr_usrreg 

pr_init 0 
pr_sysctl 
pr_fasttimo 0 








rip ctloutput 
rip usrreg 


icmp syscti 














rip_ctloutput 
rip usrreg 
igmp init 

0 

igmp fasttimo 


rip usrreg 





0326 4000000000000 


rip_ctloutput 















rip_ctloutput 
rip_usrreg 
zip_init 

0 
0 














842 
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TCP/IP 2 
BSD IP ip_protox 
IPPROTO_RAW IP 0 
IP 
IPPROTO_RAW Van Jacobson Traceout 
IP ( TTL ) Traceout 
4.3BSD[] Net/1 rip output IPPROTO RAW 
IP IP Net/2 
IP HDRINCL IPPROTO RAW | 
IP 
32.4 rip init[] |] 
domaininit IP rip. init ([ 32-7) 
47 void raw ip.c 
48 rip init() 
49 ( 
50 rawinpcb.inp, next - rawinpcb.inp prev - &rawinpcb; 
51} 
raw_ip.c 
0 32-7 rip init [N 
PCB (rawinpcb) 
socket SOCK RAW IP 
PRU ATTACH Internet PCB rawinpcb 
32.5 rip inputi |] 
ip protox IPPROTO RAW([] 7-8) 
pr input rip input ([] 32-6) IP 
32-2 ICMP[] IGMP rip input 
*icmp input rip input ICMP ICMP 
e igmp_input rip_input IGMP 
rip_input 
ICMP[] IGMP 
32-8 | rip input 
59 void raw. ip.c 
60 rip input (m) 
61 struct mbuf *m; 
62 ( 
63 struct ip *ip = mtod(m, struct ip *); 
64 struct inpcb *inp; 


[] 32-8 


rip input DD 
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65 struct socket *last = 0; 
66 ripsrc.sin addr = ip-»ip src; 
67 for (inp = rawinpcb.inp next; inp !- &rawinpcb; inp = inp->inp next) ( 
68 ` if (inp-»inp ip.ip p && inp-»inp ip.ip p != ip-»ip p) 
69. . continue; E : 
70 if (inp->inp_laddr.s_addr && 
71 inp->inp_laddr.s_addr == ip->ip_dst.s_addr) 
72 continue; 
73 if (inp->inp_faddr.s_addr && 
74 inp->inp_faddr.s_addr == ip->ip_src.s_addr) 
75 continue; 
76 if (last) { 
77 struct mbuf *n; 
78 if (n = mcopy(m, 0,. (int) M_COPYALL)) { 
79 if (sbappendaddr(&last-»so rcv, &ripsrc, 
80 n, (struct mbuf *) 0) == 0) 
81 /* should notify about lost packet */ 
82 m freem(n) ; 
83 else E 
84 2 sorwakeup (last); 
85 ) I 
86 ) 
87 last = inp->inp_socket; 
88 ) 
89 if (last) ( - 
90 if (sbappendaddr (£last->so_rcv, &ripsrc, 
91 m, (struct mbuf *) 0) == 0) 
92 m_freem(m); : 
93 else 
94 Sorwakeup (last); 
95 ) else ( B 
96 : m freem(m); 
97 ipstat.ips_noproto++; 
98 ipstat.ips_delivered--; 
99 } 
100 } . 
raw p.c 
H 32-8 (U) 
59-66 IP ripsrc PCB 
ripsrc sbappendaddr UDP IP 
sockaddr_in sin_port 0 
2. IP PCB 
67-88 IP PCB UDP[] TCP 
( ) in pcblookup 
( ) IP 
in pcblookup PCB PCB 
UDP ([] 23-26) 
3. 
68-69 PCB IP PCB 
O(socket ) IP 
4 IP| 
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TCP/IP 2 
70-75 PCB IP IP PCB 
PCB IP IP PCB 
3 0 
rip_input 
71 74 
5. 
76-94 sbappendaddr last 
23-26 sbappendaddr mbu 
rip input m copy 
6. 
95-99 | mbuf ips_noproto 
ips delivered[]IP rip input (U 8-15) 
ips delivered SNMP 
ipInDiscards[] ipInDelivers ([] 8-16) 
icmp input 
rip input ICMP rip input 
PCB[] ips noproto 8-5 
IP 
Net/3 2( VT ICMP 
RFC 1122 | [] ICMP ( 32.4) 
32.6 rip output[|[| 
32-6 ICMP[] IGMP IP rip_output IP 
send|| sendto|| sendmsg|| write writev 
5 sendto[] sendmsg 
sendto[] sendmsg U 
32-9 rip_output 
1. IP 
119-128 TP_HDRINCR M PREPEND[| IP IP 
ip output ([] 8-22) PCB 
32-10[] socket 
TOS 00 TTL 255 IP 
UDP[] TCP | IP TTI[| IP TOS 
129 | IP OPTIONS IP opts 
ip output 
2. IP IP HDRINCR 
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130-133 IP_HDRINCR IP 
ID 0 IP ID IP ID 
0 rip. outputl] ID ID 
O[] rip output ip id IP ID 
134-136 opts IP OPTIONS IP 
IP IP flags 
IP_RAWOUTPUT ip_output IP 
105 EE rav ip.c 
105 int 
106 rip_output (m, so, dst) 
107 struct mbuf *m; 
108 struct socket *so; 
109 u_long dst; 
110 { 
111 struct ip *ip; 
112 struct inpcb *inp = sotoinpcb(so); 
113 struct mbuf *opts; 
114 int flags = (so->so options & SO_DONTROUTE) | IP_ALLOWBROADCAST; 
115 /* š 
116 * If the user handed us a complete IP packet, use it. 
117 * Otherwise, allocate an mbuf for a header and fill it in. 
118 */ 
119 if ((inp->inp_flags & INP_HDRINCL) == 0) I 
120 M PREPEND(m, sizeof(struct ip), M_WAIT); 
121 ip = mtod(m, struct ip *); 
122 ip->ip_tos = 0; 
123 ip->ip_off = 0; 
124 ip->ip_p = inp->inp_ip.ip_p; 
125 ip->ip_len = m->m_pkthdr.len; 
126 ip-»ip src = inp->inp_laddr; 
127 ip->ip_dst.s_addr = dst; 
128 ip->ip_ttl = MAXTTL; 
129 opts = inp->inp_options;; 
130 } else { 
131 ip = mtod(m, struct ip *); 
132 if (ip->ip_id == 0) 
133 ip->ip_id = htons(ip id++); 
134 opts = NULL; - 4 
135 /* XXX prevent ip output from overwriting header fields */ 
136 flags |= IP RAWOUTPUT; 
137 ipstat.ips rawout++; 
138 } Š 
139 return (ip_output (m, opts, &inp->inp_route, flags, inp-»inp moptions)); 
140 ) å I 


[] 32-9 rip output UI 





































































































137 ips_rawout Traceroute Traceroute 






















































































Net/3 IP_HDRINCL 
ID 








































































































rip_output 











































































































rip output[]IP 
0 IP RAWOUTPUT Net/3 ip. output IP 



















































































































































































646 
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TCP/IP 2 
Net/2 IP_HDRINCL IP 
IP 4 0 
32.7 rip_usrreq[] [| 
UDP[] TCP 
rip_usrreq switch PRU xxx case 
32-10 PRU ATTACH socket 
A raw_ip.c 
194 int 
195 rip usrreg(so, reg, m, nam, control) 
196 struct socket *so; ` 
197 int reg; 
198 struct mbuf *m, *nam, *control; 
199 { 
200 int error = 0; 
201 struct inpcb *inp = sotoinpcb (so); 
202 extern struct socket *ip_mrouter; 
203 switch (req) { 
204 case PRU_ATTACH: 
205 if (inp) 
206 panic("rip attach"); 
207 if ((so->so state & SS PRIV) == 0) ( 
208 error = EACCES; 
209 break; 
210 } 
211 if ((error = soreserve(so, rip sendspace, rip recvspace)) || 
212 (error = in_pcballoc (so, &rawinpcb))) 
213 break; 
214 inp = (struct inpcb +) so->so_pcb; 
215 inp->inp_ip.ip_p = (int) nam; 
216 break; i . 
raw ip.c 
[] 32-10 rip usrreq U D [| PRU ATTACH Un 
194-206 Socket Socket 
Internet PCB 
1. 
207-210 IP 
| 
2. Internet PCB 
211-215 in_pcballoc Internet PCB 
IP PCB (rawinpcb) socket rip_usrreq|| nam 
socket PCB rip_input 
rip_output 
IP_HDRINCL ) 
IP IP UDP IP 
rip_input IP 
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UDP PRU_DISCONNECT 
1) PRU_DETACH PRU_DISCONNECT 
2) connect[] soconnect PRU_CONNECT 
PRU_DISCONNECT 
32-11 PRU_DISCONNECT|| PRU_ABORT|| PRU_DETACH 

217 case PRU_DISCONNECT: BIER 

218 if ((so->so_state & SS_ISCONNECTED) == 0) { 

219 error = ENOTCONN; : 

220 break; 

221 } 

222 /* FALLTHROUGH */ 

223 case PRU_ABORT: 

224 soisdisconnected (so); 

225 /* FALLTHROUGH */ 

226 case PRU_DETACH: 

227 if (inp == 0) 

228 panic("rip detach"); 

229 if (so == ip mrouter) 

230 ip mrouter done(); 

231 in pcbdetach(inp); 

232 break; 


[] 32-11 rip usrreq [| [| [| PRU DISCONNECT [| PRU ABORT [] PRU DETACH [|] [] 























































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































217-222 | PRU DISCONNECT 0 0 Ü 
223-225 PRU_ABORT case 
PRU_DISCONNECT 
226-230 close PRU_DETACH case 
PRU_DISCONNECT socket (ip_mrouter) 
ip_mrouter_done 0 mrouted (8) 
DVMPR DONE mrouted (8) 
231 in pcbdetach Internet PCB IP PCB[] (rawinpcb) 
PRU BIND IP IP 32-12 

rip input 

233-250 sockaddr in IP 3 
EADDRNOTAVAIL 

1) IP 

2) AF_INET ( AF_IMPLINK ) 

3) | TP 0.0.0.0 [] sockaddr_in 

0 ifa_ifwithaddr 





























































































































IP PCB 
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TCP/IP 2 
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raw_ip.c 
233 case PRU_BIND: 
234 { 
235 struct sockaddr_in *addr = mtod(nam, struct sockaddr_in *); 
236 if (nam->m_len != sizeof(*addr)) { 
237 error = EINVAL; 
238 break; 
239 } 
240 if ((ifnet == 0) |I 
241 ((addr->sin_family != AF_INET) && 
242 (addr->sin family != AF IMPLINK)) || 
243 (addr->sin addr.s addr && 
244 ifa ifwithaddr((struct sockaddr *) addr) == 0)) { 
245 error = EADDRNOTAVAIL; 
246 break; 
247 } 
248 inp->inp laddr = addr->sin_addr; 
249 break; : 
250 } š 
raw ip.c 
[] 32-12 rip usrreq [ [| [| PRU BIND nt 
IP IP rip input 
IP IP 
bindl| connect rip input 
32-13 PRU CONNECT 
251-270 Sockaddr in IP 
PCB UDP IP 
UDP[] in pcbconnect ( 
22-9) IP IP PCB bind 
rip input 
251 case PRU CONNECT: Te PE 
252 { 
253 struct sockaddr_in *addr = mtod(nam, struct sockaddr_in *); 
254 if (nam->m len != sizeof(*addr)) { 
255 error = EINVAL; 
256 break; 
257 } 
258 if (ifnet == 0) { 
259 error = EADDRNOTAVAIL; 
260 break; 
261 } 
262 if ((addr->sin family != AF INET) && 
263 (addr->sin_family != AF_IMPLINK)) { 
264 error = EAFNOSUPPORT; 
265 break; 
266 } à : 
267 inp->inp_faddr = addr->sin addr; 
268 soisconnected (so); 
269 break; 


U 32-13 rip usrreq [|] [| [| PRU CONNECT UI 
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shutdown PRU_SHUTDOWN 

IP shutdown 32-14 PRU CONNECT2[]| PRU SHUTDOWN 
271 case PRU CONNECT2: PE 
272 error = EOPNOTSUPP; 
273 break; 
274 /* e 
275 * Mark the connection as being incapable of further input. 
276 */ | 
277 case PRU_SHUTDOWN: 
278 socantsendmore (so) ; 
279 break; s 


E FE ip.c 


0 32-14 PRU_CONNECT2 [] PRU SHUTDOWN [| [J 
















































































































































































































































































































































































































































































271-273 IP PRU_CONNECT2 
274-279 socantsendmore 
23-14 5 pr usrreq PRU SEND 
32-15 
raw ip.c 
280 /* p 
281 * Ship a packet out. The appropriate raw output 
282 * routine handles any massaging necessary. 
283 Ef 
284 case PRU_SEND: 
285 { 
286 u_long dst; 
287 if (80->s0 state & SS ISCONNECTED) ( 
288 if (nam) ( ` 
289 error = EISCONN; 
290 break; 
291 } 
292 f dst = inp->inp_faddr.s_addr; 
293 } else { ` i . 
294 if (nam == NULL) { 
295 error = ENOTCONN; 
296 break; 
297 } 
298 dst = mtod(nam, struct sockaddr_in *)->sin_addr.s_addr; 
299 } 
300 error = rip output (m, so, dst); 
301 m = NULL; 
302 break; 
303 } . 
raw ip.c 
[] 32-15 rip usrreg [] [| [| PRU SEND DD 
280-303 (nam ) 
dst IP 


















































































































































































































































































































































rip_output mbuf| m mbu 
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| ut mbufT[] ([] rip output[]ip output| mbuf[] 
ip output 0000 ) 

32-160 [| [] rip. usrreq | fstat[] [I [] PRU SENSE 
| o [| PRU. SOCKADDR[] PRU_PEERADDR OD getsockname 
getpeername IP| LU U | 
319-324 in setsockaddr[] in_setpeeraddr PCB [] nam 

raw ip.c 
304 case PRU SENSE: p 
305 LE . 
306 * fstat: don’t bother with a blocksize. 
307 */ 
308 return (0); 
309 /* 
310 * Not supported. 
311 Ki 
312 case PRU_RCVOOB: 
313 case PRU_RCVD: 
314 case PRU LISTEN: 
315 case PRU ACCEPT: 
316 case PRU_SENDOOB: 
317 error = EOPNOTSUPP; 
318 break; 
319 case PRU_SOCKADDR: 
320 ; in_setsockaddr (inp, nam); 
321 break; 
322 case PRU_PEERADDR: 2 
323 in_setpeeraddr(inp, nam); 
324 break; 
325 default: 
326 panic("rip_usrreq"); 
327 } 
328 if (m != NULL) 
329 m freem(m); 
330 return (error); 
331 ) 


ia p.c 
[] 32-16 rip usrreq 00000000 


32.8 rip. ctloutput[|[] 
































































































































































































































setsockopt[] get sockopt rip ctloutput[|| IPO | 
| L | | 
32-17 rip ctloutput[] L L 
raw_ip.c 
144 int 
145 rip_ctloutput (op, so, level, optname, m) 
146 int op; 


147 struct socket *so; 


[] 32-17 rip usrreg [O 000 TP BpRINCL OOOO 
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148 int level, optname; 
149 struct mbuf **m; 
150 { - 
151 struct inpcb *inp = sotoinpcb(so); 
152 int error; 
153 if (level !- IPPROTO IP) 
154 return (EINVAL); 
155 switch (optname) { 
156 case IP HDRINCL: - 
157 if (op == PRCO_SETOPT || op == PRCO_GETOPT) { 
158 ' if (m == 0 |] *m == 0 || (*m)->m len < sizeof(int)) 
159 return (EINVAL); 
160 if (op == PRCO_SETOPT) { 
161 if (*mtod(*m, int *)) 
162 inp->inp flags |= INP_HDRINCL; 
163 else 
164 : inp->inp flags &= ^INP HDRINCL; 
165 (void) m-free(*m); 
166 } else { 
167 (*m)->m len = sizeof (int); 
168 *mtod(*m, int *) = inp->inp_flags & INP_HDRINCL; 
169 } 
170 return (0); 
171 } 
172 break; . 
raw D.C 
O 32-17 (LJ) 
144-172 mbuf setsockopt 
mbuf | getsockopt 
mbu 0 switch 
IP 
32-18 rip ctloutput 8 
raw ip.c 
173 case DVMRP INIT: 
174 case DVMRP DONE: 
175 case DVMRP ADD VIF: 
176 case DVMRP DEL VIF: 
177 case DVMRP ADD LGRP: 
178 case DVMRP DEL, LGRP: 
179 case DVMRP ADD MRT: 
180 case DVMRP DEL MRT: 





188 ) 
189 return (ip ctloutput(op, so, level, optname, m)); 
190 } 





raw ip.c 


O 32-18 ripusreq 000000000000 


173-188 8 setsockopt 14-9 
























































































































































85 2 TCP/IP | 
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2 
ip_mrouter_cmd 
189 [] IP | U IP IP_OPTIONS ip ctloutput| 
329 00 
IP 3 
D U t ICMP[] IGMP[] [] 
2) IP 
3) IP 
IP — IP — IP 
IP 
[] IP 3 U U IPH UO U U U 
LU | (1) U (2) 0 IPU O (| connect 030 (3) UL IP ( 
bind 1 30 0 
U U 
32.1 IP HDRINCL socket | 0 
rip_output IP (ip_p) [] socket 
IPPROTO RAW (255)] rip output (ip. p) 
32.2 IPPROTO RAW (255) 
IP 
32.3 0 
IP 
32.4 rip input o nooo 2( ) ICMP 
rip input ICMP[] IGMP 
32.5 TP | IP IP_HDRINCL 
IP BPF([] 310 ) 
32.6 IP BPF 
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o 10 
1.2 SLIP spltty([] 1-13) splimp 
splnet SLIP 
o 20 
2.1 M_EXT mbu mbuf] 
2.2 100 (MHLEN) 
2.3 mbu (2.9) 
( 2.4) 
2.4 <sys/mbuf.h> MCLALLOC|| MCLFREE 
mclrefcnt machdep.c 
O 30 
3.3 
3.4 sl_softc 0 
3.5 
EN on H 
aé 300 
nlen 
alen 
` slen 
DO 0 
1 1 nlen ong 
HO A-1 
U 40 





4.1] leread BPF 
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BPF 
BPF 
ether_input 
4.2 
if else 
U 50 
5.1 looutput 
5.2 BPF 
5.5 SC_ERROR slinput 
SC_ERROR slinput SLIP END 
5.6 IP 
Del ifp le softc 
sc = (struct le softc*) ifp; 
sc 
5.8 ICMP | 
Net/3 UDP 23-30) TCP 
U 60 
6.1 IP (RFC 950 [Mogul[] Postel 19851) [] IP 
in addr 
struct in addr ( 
union ( 
struct { u_char s bl, s b2, s b3, s bá; ) S un b; 
struct { u short s wl, s w2; } S un w; 
u long S addr; 
) S un; 
#define s addr S un.S addr. /* should be used for all code */ 








#define s host S un.S un b.s b2 /* OBSOLETE: host on imp */ 
#define s net S un.S un b.s bi /* OBSOLETE: network */ 
#define s imp S un.S un w.s w2 /* OBSOLETE: imp */ 
#define s impno S un.S un b.s b4 /* OBSOLETE: imp # */ 
#define s lh S un.S un b.s, b3 /* OBSOLETE: logical host */ 
Ji 
H A-2 
Internet 8 bit 16 bit 
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7.1 


O 80 


8.1 
8.4 
8.5 
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TCP/IP 2 
ether_output ifnet 
ifaddr arpcom ( IP ) IP 
ifaddr 
IP UDP 
3 ifa_ifwithnet 
ifaof_ifpforaddr|| rt_maskedcopy 
Telnet Net/2 
inetsw[6] 
pffindproto (PF_INET, 0, SOCK_RAW); 
RFC 1122 
ARP 
TTL 1 TTL 0 1 
255 
ICMP 
TTL 0 TTL 
4 
SLIP 
( 0) ICMP 
0 

RFC 1122 
Net/3 ip_dst 
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9.3 
9.4 IP NOP IP 4 
IP IP 
NOP 4 
9.5 86 399 399(24 x 60x 60x 
1000- 1) 28 bit 32 bit 
9.6 ip dst 
[] 10[] 
10.2 
10.3 (204 + 20) 208([] 2-16) 
10-11 m_pullup 40 mbu 2-18 
mbuf {} mbuf {} 
NULL 
NULL NULL 
NULL 40 184 
NULL 
0 MT pata MT. pata 
NULL MLPRTHDR M EXT 
MT. FTABLE 2⁄4 | Poos 
o pir U ; 
less] den — 
Y NULL 
n0] [uy To 2048 















jum 
20480 00 









































658 TCP/IP 2 China-bubcom 
EE al 



































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































10.5 
72786-349 
es c9 
0 
796 084 _ 
260484 `` 
10.6 10-11 ip off 
MF 
U 110 
11.1 0.0.0.0 
255.255.255.255 
11.2 IP 
IP ICMP 
ICMP ICMP 
11.3 
RFC 1009 
( ) 
11.4 rip input 
11.5 ICMP IP 0 
11.6 ICMP IP ia 
11.7 Neu? 
11.10 0 icmp error 
11.11 icmp send ICMP 
U 120 
12.1 IP 255.255.255.255 ff:ff:ff: ff:ff:ff| 















































































































































IP 
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224.0.0.1 
01:00:5e:00:00:01 IP 
IP 
12.2 ifreg ioctl 
ip_setmoptions|| ip_getmoptions ifunit 
INADDR_TO_IFP ifnet 
12.3 4bit[] [| [| 1110 5 LU | U U 
12.4 ip_moptions mbuf| 
108 ( 20 mbuf )[] IP. MAX MEMBERSHIPS 
25(4+1+1+2+(4x 25)=108) 
12.5 IP 
12.6 
[on | 000 
UU 
Oo A-4 
12.8 IP MAK MEMBERSHIPS 
12.9 mbu m_flags mbu M LOCAL[] ip output 
ipintr 
SunOS 5.X (ip local cksum 10 531] ) 
12.10 2?- 1(8 388 607) IP] [| IP[] 224.0.0.0 
12.11 in_addmulti | ioctl 
if_ioctl in_delmulti 
12.12 mbuf ip_getmoptions 


ip_getmoptions|| ip_ctloutput 


ip getmoptions( 


























O 130 

























































































ip_getmoptions 




































































































































































[P_ADD_MEMBERSHIP, 0, mp) 





ICMP 























































































































































































































132 max_linkhdr + sized$truct ipIGMP_MINLEN=16+20+8=44<100 
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TCP/IP 2 
( ) 
IGMP 
0 [] SLIP | [] 
(U 5-16) 
[] 140 
14.1 50 | A-E 
142 grplst_member ip_mforward 
ip_mforward ipintr ip_output ip_output 
add lgrp 
del Loo splx 
14.3 SIOCDELMULTI U [] IP 
IP 
14.4 
ip_mforward 
[] 150 
15.1 UNIX ([Stevens]) 
15.2 accept sa_len Internet 
OSI 
15.4 so_qlen 0 soqremque sogremque 
15.5 bzero splx 
dom_disposel] sbrealse CPU splimp 
15.6 sbspace 0 sbappendaddr[] sbappendcontrol (U UDP 
TCP[] [| sbappend 
sbspacel] [| OU TCP[] U sbappend 
SS_CANTRCVMORE read 
[] 160 
16.1 uio uio resid sosend 
EINVAL 
Net/2 sosend (O 16-23) 
16.2 MCLBYTES 
MCLBYTES resid 0 394[] break 
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spce>0 
16.5 
16.6 mbu mbuf 
sb cc sb hiwat 
mbu 
16.7 recvitl] recvfrom|]| recvmsg recvmsg 
msghdr Lu Lu 
recvmsg|| namelenp msg namelen 
recvfrom recvit namelenp *namelenp 
16.8 MSG EOR[] soreceive M EOR mbuf 
soreceive 
16.9 select selscan 
select tsleep 
U | | | 
0170 
17.1 copyin[] copyoutl] | mbuf 
uiomove mbu 
17.2 linger 
U 180] 
18.1 8[] | 
[] 1 2 3 1&3 |2 = =4? 142 6&3 
OOO 0000 U D DD U 
1 0 0 0 0 Ë 0 0-0 
2 0 0 1 0 O 0 0-0 
3 0 1 0 0 [ 1 dei 
A 0 1 1 0 O 1 1=[] 
5 1 0 0 0 [] l 0=[] 
6 1 0 l 1 O 1 1=[] 
7 1 1 0 0 O 0 0=[] 
8 1 1 1 1 Ë 0 0=[] 
[] A-5 
“ 2 == A ” “ 6 & 3” 
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TCP/IP 2 
1 
0 0 
18-40 1 
0 
18.2 rtentry 120 radix_node 
sockaddr_in (O 18-28) 152 3 
18.3 rn_b | 16 bit 32767 
bit(4095 ) 
U 190 
19.1 19-15 | RTF_DYNAMIC 
RTF_MODIFIED 
19.2 TCP 
([] 27-3) 
19.3 rt msghdr 76 sockaddr in ( 
) 108 ARP 112 
Sockaddr in Sockaddr dl (15x 112+20x 108)[] 3840 
( ) 8 ( 116 
108 ) 20 4000 
[] 20[] 
20.1 rtm errno (O 20-14) write 
([] 20-22) | mbuf| ( 
20-17) 
20.2 SOCK RAW pffindproto (O 7-20) 0( ) 
[] 210 
21.1 ifnet arpcom (O 3-20) 
21.2 ICMP ARP ICMP 
ARP 
ARP in_arpinput 
21.3 ARP 19-8 rtrequest 
rt_gateway sockaddr_dl 21-1 
sdl_alen 0 
21.4 Net/3 arpresolve 
arplookup rt_gateway ( 
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) 22 TCP 
UDP TCP ( 
IP ) UDP UI 
ARP 0-5 arpresolve ARP 
rt_expire arpresolve 
ether_output EHOSTUNREACH EHOSTDOWN ip_forward 
ICMP | | 
21-28 140.252.13.35 0 
140.252.13.33[] 140.252.13.34 140.252.13.32 rtreguest 
140.252.13.32 arpresolve ARP 
in arpinput ARP 
20 
21-19 arplookup 1( ) 
ARP 500 ms time.tv_sec 
mbuf m_nextpkt 
mbu mbuf 
[Cheswick[] Bellovin 1994] 
udb 0 udb.inp lport[] 0 0 ip pcbbin 
1 1024 1024 
(sa family) AF INET 22-20 
(sa len) 
15-20 sockargs bind 3 
sockaddr_in 16 C[] sizeof 
IP (sin addr) IP 
(sin port) OG E ) 0 
0 TCP[] UDP IP 
0 
bind ifa ifwithaddr([] 22-22) 
IP C.2 RFC 1122 
255.255.255.255 ifa ifwithaddr 




























































































































































































864 wu a: China-bubıcom 
——— =a 


























































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































































[] 231] 
23.1 sosend mbuf 100 
mbu 207[] | mbufl 
100 | sosend[] [| MH ALIGN mbuf| 
udp output M PREPEND 5 
(1) 72 mbuf| IP UDP 
(2) 73 100 sosend mbu 
M PERPEND[] IP[] TCP mbuf[] (3) 101 207 
sosend mbuf[] M PREPEND[] IP[] TCP 
mbufl] (4) 208 MCLBYTES sosend 
mbuf[] M PERPEND[] IP[] TCP mbuf[] (5) 
sosend | mbu IO € 65507 64 
1024 | U mbuf)[] M. PERPEND[] IP[] TCP] [] | mbuf| 
23.2 IP ip_output ip_insertoptions IP 
IP mbu IP IP mbu 
(UDP ) mbu 
ip_insertoptions mbu 100- 28- optlen 
(IP ) mbu IP IP UDP 
20 30 40 5 mbu M_PREPEND IP[] UDP 
M PREPEND M PREPEND MH ALIGN 28 mbuf 
mbu 40 IP 
23.3 in_pcbconnect connect 
UDP 
0 in_pcbconnect ( 
in_pcbbind) 
23.4 splnet 
23.5 in_pcbconnect 0 
connect connect in_pcbconnect 
23.6 ioctl SIOCGIFCONF IP 
ioctl IP | ( 
ioctl[] 19.14 sysctl 
) 
23.7 recvit mbu 
23.8 UDP connect 
0.0.0.0 0 soconnect 
sodisconnect udp_usrreq PRU_DISCONNECT 
0.0.0.0 0 sendto 
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sodisconnect PRU CONNECT 
connect PRU DISCONNECT 
connect API 
disconnect 
connect(2) " 
u connect 
ES " IP 
0.0.0.0 bind 
23.9 in pcbbind | UDP IP 
connect IP 
23.10 IP RECVDSTADDR recvmsg 
IP 
bind 
23.11 ip output([] 8-22) IP DF 
udp_output IP DF 
23.12 udp_input 
[] 24[] 
24.1 ESTABLISHED 126 820 
30 000 
24.2 tcp output IP[] TCP mbuf 
(maz linkhdr) bcopyl] IP[] TCP mbu 
40 mbuf 40 
mbu 
mbu 
24.3 bsdi 16 15 (Telnet 
Rlogin[] FTP ) vangogh.cs.berkeley.edu 20 
60 150 
(world.std.com) 417[] TCP 809[] UDP 
U 250] 
25.1 24-5 2592 000] (300 ) 531 285 ACK 5 
ACK 25 tcp_fasttimo ACK 
TCP ACK 96%(25 24[] ) 
24.3 400 
TCP 5 
ACK 
ACK 


























































































































































































































866 TCP/IP 2 


13-14 igmp_timers_are_running 


25.2 
25.3 


25.4 


25.5 


25.6 


25.7 


U 260 
26.1 
26.2 


26.3 


26.4 


26.5 
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tcp keepintvl 










































































tcp slowtimo tcp maxidle 
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65495 65535 URG 
65535 URG 
65495 
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